# TO DO
# - Framework for quantifying the effects of within- and across-population variation in thermal limits to spatial patterns in vulnerability to warming. Comparing predictions based on 1) median, 2) overall CTmax vs. temp regression, 3) population variation in intercepts, 4) population variation in both slope and intercept. The end metric I could use to compare across scenarios is i) the cumulative amount of underestimation (summed across populations) or ii) the number of sites that have overestimated WT, or iii) the slope of WT (local adaptation and seasonal acclimation should result in more shallow slopes).
Site Characteristics
site_temps = full_data %>%
dplyr::select(site, lat, season, doy, collection_temp, collection_salinity) %>%
distinct() %>%
filter(doy > 100)
Copepods were collected by surface tow from sites across the Western
Atlantic at several times throughout the year. The sites are shown
below. Temperatures at the time of collection were measured using a
manual thermometer. Across the entire set of collections, temperature
ranged from 10°C to 36°C.
coords = site_data %>%
dplyr::select(site, long, lat) %>%
distinct()
site_map = map_data("world") %>%
filter(region %in% c("USA", "Canada")) %>%
ggplot() +
geom_polygon(aes(x = long, y = lat, group = group),
fill = "lightgrey") +
coord_map(xlim = c(-85,-60),
ylim = c(25, 48)) +
geom_point(data = coords,
mapping = aes(x = long, y = lat, colour = site),
size = 3) +
scale_colour_manual(values = site_cols) +
labs(x = "Longitude",
y = "Latitude") +
theme_matt(base_size = 16)
site_temp_plot = ggplot(site_temps, aes(x = doy, y = collection_temp, colour = site)) +
geom_line(linewidth = 2) +
geom_point(size = 5) +
scale_colour_manual(values = site_cols) +
labs(y = "Temperature (°C)",
x = "Day of the Year") +
theme_matt() +
theme(legend.position = "right")
ggarrange(site_map, site_temp_plot, common.legend = T, legend = "bottom")

Collections aimed to obtain copepods near the onset of peak
temperatures, after peak temperatures, and then at low temperatures.
Regional data is not available for all sites, so here we’ve pieced
together daily temperature values from either local temperature sensors
(sites in Florida and the Chesapeake) and high resolution satellite
temperature data (Connecticut, Maine, and the Canadian sites). This
satellite data comes from the NOAA 1/4° Daily Optimum Interpolation Sea
Surface Temperature (OISST).
These temperature profiles are shown below, with the temperatures
measured during the time of collection included for comparison In
several cases collection temperature does not match the recorded daily
averages, but the temperature records do give a general sense of the
timing of seasonal maxima. In general, the first sample from each site
fell just after the site reached the warmest period. The exception to
that pattern is in Florida, where collections occurred after an extended
period of high temperatures.
temp_profiles = temp_profiles %>%
mutate(region = fct_relevel(region, "Florida", "Chesapeake", "Connecticut",
"Maine", "Shediac", "Miramichi"))
site_temps2 = site_temps %>%
mutate(region = case_when(
site == "Manatee River" ~ "Florida",
site == "Ft. Hamer" ~ "Florida",
site == "Tyler Cove" ~ "Chesapeake",
site == "Ganey's Wharf" ~ "Chesapeake",
site == "Esker Point" ~ "Connecticut",
site == "Sawyer Park" ~ "Maine",
site == "St. Thomas de Kent Wharf" ~ "Shediac",
site == "Ritchie Wharf" ~ "Miramichi"),
region = fct_relevel(region, "Florida", "Chesapeake", "Connecticut",
"Maine", "Shediac", "Miramichi"))
ggplot(temp_profiles, aes(x = doy, y = temp_c)) +
facet_wrap(region~.) +
geom_point(data = site_temps2,
aes(x = doy, y = collection_temp, colour = site),
size = 3) +
geom_line() +
scale_colour_manual(values = site_cols) +
labs(x = "Day of the Year",
y = "Mean Daily Temp. (°C)") +
theme_matt_facets() +
theme(legend.position = "none")

Exact locations for the sites are provided here.
site_data %>%
arrange(lat) %>%
select("Site" = site, "Region" = region, "Lat" = lat, "Long" = long) %>%
knitr::kable(align = "c")
| Key Largo |
Florida |
25.28391 |
-80.33014 |
| Manatee River |
Florida |
27.50561 |
-82.57277 |
| Ft. Hamer |
Florida |
27.52488 |
-82.43101 |
| Tyler Cove |
Maryland |
38.35083 |
-76.22902 |
| Ganey’s Wharf |
Maryland |
38.80555 |
-75.90906 |
| Esker Point |
Connecticut |
41.32081 |
-72.00166 |
| Sawyer Park |
Maine |
43.90698 |
-69.87179 |
| St. Thomas de Kent Wharf |
New Brunswick |
46.44761 |
-64.63692 |
| Ritchie Wharf |
New Brunswick |
47.00481 |
-65.56291 |
Nested within each of the three regions (South, Central, and Northern
regions) are pairs of low and high salinity sites:
data.frame("Region" = c("South", "Central", "North"),
"Low Salinity" = c("Ft. Hamer", "Ganey's Wharf", "Ritchie Wharf"),
"High Salinity" = c("Manatee River", "Tyler Cove", "St. Thomas de Kent Wharf")) %>%
knitr::kable(align = "c")
| South |
Ft. Hamer |
Manatee River |
| Central |
Ganey’s Wharf |
Tyler Cove |
| North |
Ritchie Wharf |
St. Thomas de Kent Wharf |
There are fairly well-established divergences between high salinity
and low salinity populations of Acartia tonsa. These sets of
geographically proximate but isolated populations provide independent
comparisons of the effects of seasonality. Shown here are the collection
conditions for these pairs of sites. Temperature was typically similar
across the pairs within each collection, while salinity differences were
fairly stable across collections.
season_cols = c("early" = "grey75",
"peak" = "grey50",
"late" = "grey25")
sal_regions = data.frame(region = rep(c("South", "Central", "North"), each = 2),
site = c("Ft. Hamer", "Manatee River",
"Ganey's Wharf", "Tyler Cove",
"Ritchie Wharf", "St. Thomas de Kent Wharf"),
salinity = c("low", "high"))
sal_comps = full_data %>%
filter(site %in% sal_regions$site) %>%
inner_join(sal_regions, by = c("site")) %>%
select( region = region.y, site, salinity, season, doy, collection_temp, collection_salinity,
size, ctmax, warming_tol) %>%
mutate(salinity = fct_relevel(salinity, "low", "high"),
region = fct_relevel(region, "South", "Central", "North"))
sal_comp_temps = sal_comps %>%
select(salinity, season, region, collection_temp, collection_salinity) %>%
distinct() %>%
ggplot(aes(x = salinity, y = collection_temp, colour = season, group = season)) +
facet_wrap(region~.) +
geom_line(linewidth = 1.5) +
geom_point(size = 4) +
scale_colour_manual(values = season_cols) +
labs(y = "Collection Temp. (°C)",
x = "") +
theme_matt_facets(base_size = 14)
sal_comp_sal = sal_comps %>%
select(salinity, season, region, collection_temp, collection_salinity) %>%
distinct() %>%
ggplot(aes(x = salinity, y = collection_salinity, colour = season, group = season)) +
facet_wrap(region~.) +
geom_line(linewidth = 1.5) +
geom_point(size = 4) +
scale_colour_manual(values = season_cols) +
labs(y = "Collection Salinity (psu)",
x = "Salinity") +
theme_matt_facets(base_size = 14)
ggarrange(sal_comp_temps, sal_comp_sal, nrow = 2, common.legend = T, legend = "right")

# sal_comps %>%
# select(site, salinity, season, region, collection_temp, collection_salinity) %>%
# distinct() %>%
# ggplot(aes(x = collection_salinity, y = collection_temp, colour = site)) +
# facet_grid(region~.) +
# geom_point(size = 4) +
# #stat_ellipse() +
# #geom_path(arrow = arrow(length = unit(0.1, "inches"), type = "closed")) +
# scale_colour_manual(values = site_cols) +
# theme_matt_facets(base_size = 14)
The latitudinal gradient covers a wide range of seasonality. Shown
below is the temperature range. While based on collection temperatures,
and therefore an underestimate of the total seasonal range of
temperatures, these patterns are representative of the expected
latitudinal gradient in seasonality.
site_temps %>%
group_by(site, lat) %>%
summarise(temp_range = max(collection_temp) - min(collection_temp)) %>%
ggplot(aes(x = lat, y = temp_range)) +
geom_point(aes(colour = site),
size = 3) +
scale_color_manual(values = site_cols) +
labs(x = "Latitude",
y = "Collection Temp. Range (°C)") +
theme_matt() +
theme(legend.position = "right")

Phenotypic Measurements
Critical Thermal Limits
A total of 456 individuals were examined. Critical thermal limits and
body size measurements were made before individuals were preserved in
ethanol. We excluded data for 7 individuals, detailed below. These
individuals had either very low CTmax or were, upon re-examination of
photographs, identified as juveniles instead of mature females. With
these individuals excluded, the full data set contains 449
phenotyped individuals.
excluded %>%
select(region, site, season, collection_temp, collection_salinity, replicate, tube, ctmax, size) %>%
knitr::kable(align = "c")
| Florida |
Manatee River |
peak |
34.0 |
29 |
2 |
6 |
38.45833 |
0.616 |
| Florida |
Manatee River |
peak |
34.0 |
29 |
2 |
7 |
38.23750 |
0.593 |
| Florida |
Ft. Hamer |
late |
20.0 |
18 |
2 |
3 |
36.59280 |
0.619 |
| Maryland |
Tyler Cove |
peak |
29.5 |
15 |
2 |
2 |
36.84375 |
0.614 |
| Connecticut |
Esker Point |
early |
22.5 |
30 |
2 |
3 |
30.02604 |
0.687 |
| Maine |
Sawyer Park |
peak |
22.0 |
30 |
1 |
4 |
30.81424 |
0.865 |
| New Brunswick |
St. Thomas de Kent Wharf |
late |
13.5 |
28 |
1 |
3 |
28.78299 |
1.039 |
Critical thermal maxima (CTmax) was measured using a custom setup.
The method uses a standard dynamic ramping assay to determine the
maximum temperature individuals could sustain normal functioning. This
differs from lethal temperatures, and indeed, all individuals observed
so far recovered following the assay.
Individuals were rested for one hour after collection before the
assay. During the assay, copepods were held in artificial seawater,
composed of bottled spring water and Instant Ocean salt mix adjusted to
match collection salinities. During the assay, several ‘control’
individuals were maintained in this solution at ambient temperatures
without the temperature ramp to ensure that there was no background
mortality. When sorting individuals from the plankton tow contents, they
were held in a 50:50 mix of 60 um filtered water from the collection
site and artificial seawater as an additional acclimation step.
Sample sizes varied slightly across experiments, but most sites had
20 individuals measured per season. The major exceptions were the early
samples from the Florida sites and the late sample from Sawyer Park
(Maine). Only two sets of samples (peak and late) were collected from
Fort Hamer and Manatee River. No samples were collected from Key Largo
for this project, as Acartia tonsa wasn’t present in the water
during the peak season, likely due to the recent extreme heat event. The
late season collection from Sawyer Park occurred after Acartia
tonsa abundance decreased. Samples from this period were dominated
by Acartia hudsonica instead.
ggplot(full_data, aes(x = site, fill = site)) +
facet_wrap(season~.) +
geom_hline(yintercept = c(0,20),
colour = "grey70") +
geom_bar() +
scale_fill_manual(values = site_cols) +
coord_flip() +
theme_matt() +
theme(legend.position = "none",
panel.border = element_rect(linewidth = 1,
fill = NA),
strip.text = element_text(size = 20),
axis.title.y = element_blank())

Shown below are the measured CTmax values. Note: CTmax values for the
early season Key Largo copepods were collected at the end of February
2023 as part of a separate project. Body size values were not measured
during this project, nor were copepods individually preserved after the
experiments. These early season CTmax values are included as a point of
comparison. Individual measurements are shown in small points for each
collection. The large points indicate the mean values for each
collection.
mean_ctmax = full_data %>%
group_by(site, season, doy, collection_temp) %>%
summarize(mean_ctmax = mean(ctmax),
median_ctmax = median(ctmax))
ggplot(full_data, aes(x = season, y = ctmax, colour = site)) +
geom_line(data = mean_ctmax,
aes(y = mean_ctmax, group = site),
position = position_dodge(width = 0.4),
linewidth = 1) +
geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
dodge.width = 0.4),
alpha = 0.3) +
geom_point(data = mean_ctmax,
aes(y = mean_ctmax),
position = position_dodge(width = 0.4),
size = 4) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax (°C)",
x = "Season") +
theme_matt() +
theme(legend.position = "right",
legend.title.align = 0.125)

CTmax data for each individual site is shown below, plotted against
day of the year.
ggplot(full_data, aes(x = doy, y = ctmax, colour = site)) +
facet_wrap(.~site, scales = "free") +
geom_line(data = mean_ctmax,
aes(y = mean_ctmax, group = site),
position = position_dodge(width = 0.4),
linewidth = 3, alpha = 0.5) +
# geom_line(data = mean_ctmax,
# aes(y = collection_temp, group = site),
# position = position_dodge(width = 0.4),
# linewidth = 2,
# colour = "grey") +
geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
dodge.width = 0.4),
alpha = 0.8) +
# geom_point(data = mean_ctmax,
# aes(y = median_ctmax),
# position = position_dodge(width = 0.4),
# size = 4) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax (°C)",
x = "Day of Year") +
theme_matt() +
theme(legend.position = "none",
legend.title.align = 0.125)

Warming tolerance
Warming tolerance (the difference between thermal limits and
environmental temperatures) is a commonly used metric of climate
vulnerability. We calculated this as the difference between measured
CTmax values and the collection temperature. Smaller warming tolerance
values indicate that populations were nearer to their upper thermal
limits, and may therefore be more vulnerable to additional warming.
mean_wt = full_data %>%
group_by(site, season) %>%
summarize(mean_wt = mean(warming_tol),
median_wt = median(warming_tol))
ggplot(full_data, aes(x = season, y = warming_tol, colour = site)) +
geom_line(data = mean_wt,
aes(y = mean_wt, group = site),
position = position_dodge(width = 0.4),
linewidth = 1) +
geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
dodge.width = 0.4),
alpha = 0.3) +
geom_point(data = mean_wt,
aes(y = mean_wt),
position = position_dodge(width = 0.4),
size = 4) +
scale_colour_manual(values = site_cols) +
labs(y = "Warming Tolerance (°C)",
x = "Season") +
theme_matt() +
theme(legend.position = "right",
legend.title.align = 0.125)

Body Size
Following the CTmax assay, individuals were photographed for body
size measurements. Prosome lengths were measured from these photographs
using a scale micrometer and the software ImageJ. These measurements are
shown below. As before, large points indicate the mean body size. While
less cohesive than CTmax, a general trend of increasing body size with
latitude and time of year can be seen.
mean_size = full_data %>%
group_by(site, season, doy, collection_temp) %>%
summarize(mean_size = mean(size),
median_size = median(size))
ggplot(full_data, aes(x = season, y = size, colour = site)) +
geom_line(data = mean_size,
aes(y = mean_size, group = site),
position = position_dodge(width = 0.4),
linewidth = 1) +
geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
dodge.width = 0.4),
alpha = 0.3) +
geom_point(data = mean_size,
aes(y = mean_size),
position = position_dodge(width = 0.4),
size = 4) +
scale_colour_manual(values = site_cols) +
labs(y = "Prosome Length (mm)",
x = "Season") +
theme_matt() +
theme(legend.position = "right",
legend.title.align = 0.125)

Shown below is the body size data for each individual site.
ggplot(drop_na(full_data, size), aes(x = doy, y = size, colour = site)) +
facet_wrap(.~site) +
geom_line(data = drop_na(mean_size, mean_size),
aes(y = mean_size, group = site),
position = position_dodge(width = 0.4),
linewidth = 3, alpha = 0.5) +
geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
dodge.width = 0.4),
alpha = 0.8) +
# geom_point(data = mean_ctmax,
# aes(y = median_ctmax),
# position = position_dodge(width = 0.4),
# size = 4) +
scale_colour_manual(values = site_cols) +
labs(y = "Prosome Length (mm)",
x = "Day of Year") +
theme_matt() +
theme(legend.position = "none",
legend.title.align = 0.125)

Salinity Pair Comparisons
The three pairs of cross-salinity comparisons do show evidence for
fine-scale trait divergence, although there was no consistent pattern in
the direction or magnitude of differences. CTmax was similar across
sites in the Southern and Central pairs. In the Northern pair, CTmax
tended to be slightly lower for individuals from the low salinity site.
Size was more variable between the paired sites. In the South, low
salinity individuals were consistently smaller than high salinity
individuals, despite the similar temperatures. In the Central pair,
individuals from the low salinity site tended to be slightly larger than
those from the high salinity site, although this varied seasonally.
Sizes tended to be more similar across the collections from the Northern
pair.
sal_comp_ctmax_plot = sal_comps %>%
ggplot(aes(x = salinity, y = ctmax, colour = season, group = season)) +
facet_wrap(region~.) +
geom_point(size = 2,
position = position_dodge(width = 0.2)) +
#geom_line(size = 1.5) +
scale_colour_manual(values = season_cols) +
labs(y = "CTmax (°C)",
x = "") +
theme_matt_facets(base_size = 14)
sal_comp_size_plot = sal_comps %>%
ggplot(aes(x = salinity, y = size, colour = season, group = season)) +
facet_wrap(region~.) +
geom_point(size = 2,
position = position_dodge(width = 0.2)) +
#geom_line(size = 1.5) +
scale_colour_manual(values = season_cols) +
labs(y = "Prosome Length (mm)",
x = "") +
theme_matt_facets(base_size = 14)
ggarrange(sal_comp_ctmax_plot, sal_comp_size_plot, nrow = 2, common.legend = T, legend = "right")

###
sal_comp_ctmax.model = lm(ctmax ~ collection_temp, data = sal_comps)
# summary(ctmax_temp.model)
# car::Anova(ctmax_temp.model)
sal_comp_ctmax_resids = residuals(sal_comp_ctmax.model)
sal_comp_size.model = lm(size ~ collection_temp, data = sal_comps)
# summary(size_temp.model)
# car::Anova(size_temp.model)
sal_comp_size_resids = residuals(sal_comp_size.model)
sal_comp_ctmax_resid_plot = sal_comps %>%
mutate(ctmax_resids = sal_comp_ctmax_resids,
size_resids = sal_comp_size_resids) %>%
ggplot(aes(x = salinity, y = ctmax_resids, colour = season, group = season)) +
facet_wrap(region~.) +
geom_point(size = 2,
position = position_dodge(width = 0.5)) +
#geom_line(size = 1.5) +
scale_colour_manual(values = season_cols) +
labs(y = "CTmax \nResiduals",
x = "") +
theme_matt_facets(base_size = 14)
sal_comp_size_resid_plot = sal_comps %>%
mutate(ctmax_resids = sal_comp_ctmax_resids,
size_resids = sal_comp_size_resids) %>%
ggplot(aes(x = salinity, y = size_resids, colour = season, group = season)) +
facet_wrap(region~.) +
geom_point(size = 2,
position = position_dodge(width = 0.5)) +
#geom_line(size = 1.5) +
scale_colour_manual(values = season_cols) +
labs(y = "Prosome Length \nResiduals",
x = "") +
theme_matt_facets(base_size = 14)
#ggarrange(sal_comp_ctmax_resid_plot, sal_comp_size_resid_plot, nrow = 2, common.legend = T, legend = "right")
Trait Correlations
Regardless of the underlying mechanism (genetic differentiation or
phenotypic plasticity), we expect that collections from warmer waters
should yield copepods with higher thermal limits and smaller body sizes.
Our observations largely fit this expectation, with strong increases in
CTmax at higher temperatures, and a general decrease in prosome lengths
as temperature increased.
ctmax_temp_plot = ggplot(full_data, aes(x = collection_temp, y = ctmax)) +
geom_smooth(method = "lm", se = T,
linewidth = 2,
colour = "grey") +
geom_point(aes(colour = site),
size = 2, alpha = 0.7) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax (°C)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "none")
size_temp_plot = ggplot(full_data, aes(x = collection_temp, y = size)) +
geom_smooth(method = "lm", se = T,
linewidth = 2,
colour = "grey") +
geom_point(aes(colour = site),
size = 2, alpha = 0.7) +
scale_colour_manual(values = site_cols) +
labs(y = "Prosome Length (mm)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "right")
wt_temp_plot = ggplot(full_data, aes(x = collection_temp, y = warming_tol)) +
geom_smooth(method = "lm", se = T,
linewidth = 2,
colour = "grey") +
geom_point(aes(colour = site),
size = 2, alpha = 0.7) +
scale_colour_manual(values = site_cols) +
labs(y = "Warming Tolerance (°C)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "right")
ggarrange(ctmax_temp_plot, wt_temp_plot, size_temp_plot, common.legend = T, legend = "bottom", nrow = 1)

Shown below are these temperature correlations for each individual
population. Variation in the temperature sensitivity of these traits
appears to vary across populations, with reduced slopes in both the
lowest and the highest latitude populations. Again, we emphasize that
this observed trait variation may stem from either (or both) plastic and
genetic effects. However, these observations provide estimates for
realistic patterns in temperature sensitivity for these populations.
ggplot(full_data, aes(x = collection_temp, y = ctmax)) +
facet_wrap(.~site) +
geom_smooth(method = "lm", se = T,
linewidth = 2,
colour = "grey") +
geom_point(aes(colour = site),
size = 2, alpha = 0.7) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax (°C)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "none")

ggplot(full_data, aes(x = collection_temp, y = size)) +
facet_wrap(.~site) +
geom_smooth(method = "lm", se = T,
linewidth = 2,
colour = "grey") +
geom_point(aes(colour = site),
size = 2, alpha = 0.7) +
scale_colour_manual(values = site_cols) +
labs(y = "Prosome Length (mm)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "none")

One additional correlation of interest is the relationship between
prosome length and CTmax. In many cases, larger body sizes are
associated with cold adaptation/acclimation, and there is a general
trend of decreasing thermal limits with increasing size. Shown below is
the relationship between prosome length and CTmax in our data set.
Individual regression lines for each site are also included - the dark
grey lines in the background represent the ‘universal’ regression for
that site, with individual colored regression lines for each collection.
Across our collections, we see evidence for this relationship, with
larger individuals having lower thermal limits.
universal_size = full_data %>%
ggplot(aes(x = size, y = ctmax)) +
# geom_smooth(data = filter(full_data, ctmax > 31),
# aes(x = size, y = ctmax),
# method = "lm",
# colour = "grey60",
# se = F,
# linewidth = 2) +
geom_smooth(method = "lm", se = T,
linewidth = 2,
colour = "grey70") +
geom_point(aes(colour = site),
size = 2, alpha = 0.7) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax (°C)",
x = "") +
theme_matt(base_size = 14) +
theme(legend.position = "right",
axis.title.x = element_blank())
pop_size = full_data %>%
ggplot(aes(x = size, y = ctmax, colour = site, group = season)) +
facet_wrap(site~.) +
# geom_smooth(data = filter(full_data, ctmax > 31),
# aes(x = size, y = ctmax),
# method = "lm",
# colour = "grey60",
# se = F,
# linewidth = 2) +
geom_smooth(data = full_data,
aes(x = size, y = ctmax, group = site),
colour = "grey20", method = "lm", se = F) +
geom_point(size = 1.3, alpha = 0.3) +
geom_smooth(method = "lm", se = F,
linewidth = 1) +
scale_colour_manual(values = site_cols) +
scale_x_continuous(breaks = c(0.6, 0.8, 1)) +
labs(y = "CTmax (°C)",
x = "Prosome Length (mm)") +
theme_matt(base_size = 14) +
theme(legend.position = "right")
ggarrange(universal_size, pop_size, common.legend = T, legend = "none", nrow = 2)

This relationship may be affected by changes in temperature at each
site, however, which may affect both body size and thermal limits. If
there is a true mechanistic relationship between body size and thermal
limits, we would expect to see this relationship emerge
within populations or even individual collections.
Shown below is the relationship between CTmax and size residuals,
acquired from regressions of these traits against collection
temperature. This substantially reduces the strength of the apparent
relationship, but there is still a slightly negative overall
relationship, spanning both across-population, within-population, and
even within-collection scales (see the Sawyer Park collections, for
example).
filtered_data = full_data %>%
drop_na(size, ctmax) %>%
mutate(temp_cent = scale(collection_temp, scale = F),
sal_cent = scale(collection_salinity, scale = F),
sal_type = if_else(collection_salinity > 20, "High", "Low"))
ctmax_temp.model = lm(ctmax ~ collection_temp + site, data = filtered_data)
ctmax_resids = residuals(ctmax_temp.model)
size_temp.model = lm(size ~ collection_temp + site, data = filtered_data)
size_resids = residuals(size_temp.model)
universal_resids = filtered_data %>%
mutate(ctmax_resids = ctmax_resids,
size_resids = size_resids)
all_resids = ggplot(universal_resids, aes(x = size_resids, y = ctmax_resids)) +
# geom_smooth(data = filter(full_data, ctmax > 31),
# aes(x = size, y = ctmax),
# method = "lm",
# colour = "grey60",
# se = F,
# linewidth = 2) +
geom_smooth(method = "lm", se = T,
linewidth = 2,
colour = "grey70") +
geom_point(aes(colour = site),
size = 2, alpha = 0.7) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Residuals",
x = "") +
theme_matt(base_size = 14) +
theme(legend.position = "right",
axis.title.x = element_blank())
pop_resids = ggplot(universal_resids, aes(x = size_resids, y = ctmax_resids, colour = site, group = season)) +
facet_wrap(site~.) +
# geom_smooth(data = filter(full_data, ctmax > 31),
# aes(x = size, y = ctmax),
# method = "lm",
# colour = "grey60",
# se = F,
# linewidth = 2) +
geom_smooth(aes(x = size_resids, y = ctmax_resids, group = site),
colour = "grey20", method = "lm", se = F) +
geom_point(size = 1.3, alpha = 0.3) +
geom_smooth(method = "lm", se = F,
linewidth = 1) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Residuals",
x = "Prosome Length Residuals") +
theme_matt(base_size = 14) +
theme(legend.position = "right")
ggarrange(all_resids, pop_resids, common.legend = T, legend = "none", nrow = 2)

To more formally test the relationships between CTmax, collection
temperature, and size, we used a linear mixed effects model, structured
as
ctmax ~ collection_temp + size + salinity_type + (1|site).
This examines the effects of temperature and size on CTmax, along with
differences between the salinity groupings. Collection temperature was
centered and salinity type assigned (“low” salinity as anything below 20
psu, “high” salinity as anything above 20 psu) before model fitting. The
model also includes random intercepts for each site and random slopes
for collection temperature (i.e. - variation in the acclimation capacity
of CTmax).
Collection temperature and body size both had a significant effect on
CTmax, but salinity type did not. The overall effect of temperature
suggests an increase in CTmax of 0.2°C per °C increase in collection
temperature (i.e. - an ARR value of 0.2), while increasing body sizes
decrease CTmax by -3.15°C per mm (or a decrease of ~-0.315°C per tenth
of a mm, which is more biologically realistic for A. tonsa).
While not significant, the model suggests low salinity sites had lower
thermal limits by ~1°C.
#summary(ctmax.model)
effects_summary = data.frame(
"Temperature" = unname(fixef(ctmax.model)["temp_cent"]),
"Size" = unname(fixef(ctmax.model)["size"]),
"Salinity" = unname(fixef(ctmax.model)["sal_typeLow"]))
knitr::kable(effects_summary)
| 0.195262 |
-3.153573 |
-1.041622 |
By extracting the conditional mode for the random effects, we can
also examine how thermal limits vary across sites beyond the influence
of collection temperatures and body sizes. Shown below are these values,
extracted from the linear mixed effects model. We can see that, similar
to what’s been observed in common garden experiments with A.
tonsa previously, significant divergences are present at only a few
sites, with Fort Hamer and Ritchie Wharf having increased and decreased
thermal limits respectively. Interestingly, both of these sites were low
salinity sites, also in line with previous results suggesting gene flow
between high salinity sites may constrain differentiation.
pop_effs = REsim(ctmax.model) %>%
dplyr::select("site" = groupID, term, mean, sd) %>%
filter(term == "(Intercept)") %>%
inner_join(site_data, by = c("site")) %>%
mutate(site = fct_reorder(site, lat))
#plotREsim(REsim(ctmax.model)) # plot the interval estimates
ggplot(pop_effs, aes(x = lat, y = mean, colour = site)) +
geom_hline(yintercept = 0) +
geom_errorbar(aes(ymin = mean - 1.96 * sd, ymax = mean + 1.96 * sd),
width = 0.5, linewidth = 1) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(x = "Latitude",
y = "Population Effect") +
theme_matt() +
theme(legend.position = "right")

Finally, shown below are the estimated random slopes for each site.
These represent the effects of collection temperature on CTmax for each
site. Interestingly, these estimates diverge from the results of
previous common garden experiments, which showed the strongest
plasticity in high latitude sites. Here, acclimation appears to peak in
mid-latitudes, and decrease at both high and low latitude sites.
coefficients(ctmax.model)$site %>%
janitor::clean_names() %>%
rownames_to_column(var = "site") %>%
inner_join(site_data) %>%
mutate(site = fct_reorder(site, lat)) %>%
ggplot(aes(x = temp_cent, y = site)) +
geom_point(aes(colour = site),
size = 5) +
scale_colour_manual(values = site_cols) +
labs(x = "ARR") +
theme_matt() +
theme(legend.position = "none",
axis.title.y = element_blank())

Trait Variability
Shown below is the trait variation (ranges) for each site. Ranges are
calculated for each collection separately.
trait_ranges = full_data %>%
group_by(site, season, collection_temp, collection_salinity, doy, lat) %>%
summarise(mean_ctmax = mean(ctmax),
ctmax_range = max(ctmax) - min(ctmax),
ctmax_var = var(ctmax),
mean_size = mean(size),
size_range = max(size) - min(size),
size_var = var(size)) %>%
mutate(prop_ctmax_range = ctmax_range / mean_ctmax,
prop_size_range = size_range / mean_size)
ctmax_range_temp = ggplot(trait_ranges, aes(x = collection_temp, y = ctmax_range, colour = site)) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Range (°C)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "right")
ctmax_var_temp = ggplot(trait_ranges, aes(x = collection_temp, y = ctmax_var, colour = site)) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Range (°C)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "right")
size_range_temp = ggplot(trait_ranges, aes(x = collection_temp, y = size_range, colour = site)) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "Size Range (mm)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "right")
size_var_temp = ggplot(trait_ranges, aes(x = collection_temp, y = size_var, colour = site)) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "Size Range (mm)",
x = "Collection Temp. (°C)") +
theme_matt() +
theme(legend.position = "right")
ggarrange(ctmax_range_temp, size_range_temp, common.legend = T, legend = "right")

Changes in trait variance may be indicative of phenotypic selection.
If selection (as opposed to acclimation) are driving seasonal changes,
we may expect to see a reduction in variance in the peak samples
relative to the early season samples. Note that early season collection
temperatures this year were higher than expected, driven by fairly
strong heatwaves across the North Atlantic. As shown in the temperature
profiles for each site, the ‘early’ samples were collected just after
high temperatures were reached, while ‘peak’ samples were collected
after sites had experienced high temperatures for several weeks
(generations). As warming tolerances were fairly high throughout this
period, we will assume that selection was weak before the early samples.
If the early onset of high temperatures filtered out vulnerable
genotypes prior to our sampling, the results will be a conservative
estimate of the effects of selection on trait variance.
Shown below is the seasonal progression of variance in CTmax for each
site. For many sites, variance decreased between the early and peak
samples, and then increased again in the late sample. For some sites
(e.g. Esker Point), this increase in the late sample was
substantial.
ggplot(trait_ranges, aes(x = season, y = ctmax_var, colour = site)) +
geom_line(aes(group = site),
linewidth = 1.5) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Variance",
x = "Season") +
theme_matt() +
theme(legend.position = "right",
legend.title.align = 0.125)

Shown below is the seasonal progression of variance in body size. A
similar pattern of decreasing variance in peak samples relative to early
and late samples is again seen for many sites. The obvious exception is
the Esker Point sample, which saw the opposite trend.
ggplot(trait_ranges, aes(x = season, y = size_var, colour = site)) +
geom_line(aes(group = site),
linewidth = 1.5) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Variance",
x = "Season") +
theme_matt() +
theme(legend.position = "right",
legend.title.align = 0.125)

Shown below are the seasonal changes in trait variance for each site
individually.
ggplot(trait_ranges, aes(x = season, y = ctmax_var, colour = site)) +
facet_wrap(site~.) +
geom_line(aes(group = site),
linewidth = 1.5) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Variance",
x = "Season") +
theme_matt() +
theme(legend.position = "none",
legend.title.align = 0.125)

ggplot(trait_ranges, aes(x = season, y = size_var, colour = site)) +
facet_wrap(site~.) +
geom_line(aes(group = site),
linewidth = 1.5) +
geom_point(size = 3) +
scale_colour_manual(values = site_cols) +
labs(y = "CTmax Variance",
x = "Season") +
theme_matt() +
theme(legend.position = "none",
legend.title.align = 0.125)

Comparing rates of change
Both CTmax and body size varied between sites and across seasons. It
can be difficult to directly compare these two traits. We take two
approaches to ease this comparison. Shown below is a comparison of the
slopes from the trait regressions against collection temperature for
each population, standardized by the standard deviation of the trait for
each population (across all collections). This presents change per
degree change in collection temperature in units of standard deviations
for both CTmax and body size.
adj_slopes = full_data %>%
group_by(site, lat) %>%
arrange(doy) %>%
filter(site != "Key Largo") %>%
summarize("ctmax_slope" = coef(lm(ctmax ~ collection_temp))["collection_temp"],
"mean_ctmax" = mean(ctmax),
"ctmax_sd" = sd(ctmax),
"size_slope" = coef(lm(size ~ collection_temp))["collection_temp"],
"mean_size" = mean(size),
"size_sd" = sd(size),
"temp_range" = max(collection_temp) - min(collection_temp)) %>%
drop_na() %>%
mutate(adj_ctmax_slope = ctmax_slope / ctmax_sd,
adj_size_slope = size_slope / size_sd) %>%
pivot_longer(cols = contains("_slope"),
names_to = "slope_type",
values_to = "slope")
# ggplot(adj_slopes, aes(x = lat, y = temp_range)) +
# geom_point() +
# theme_matt()
ggplot(filter(adj_slopes, str_detect(slope_type, "adj_")), aes(x = slope_type, y = abs(slope),
group = site, colour = site)) +
geom_hline(yintercept = 0) +
geom_line(linewidth = 1) +
scale_colour_manual(values = site_cols) +
labs(x = "",
y = "Slope (absolute value)") +
theme_matt() +
theme(legend.position = "right",
axis.text.x = element_text(angle = 300, hjust = 0, vjust = 0.5))

Haldanes are a similar unit, representing change in units of standard
deviations per generation. This can be a useful metric for comparing
across traits, especially as the number of generations covered by our
sampling period likely varies across populations. The calculation of
haldanes is taken from Hendry and Kinnison (1999), which in turn is
based on work from Gingerich (1993). We estimated the number of
generations passed between collections using the empirical relationship
between temperature and development time for Acartia tonsa from
Leandro et al. (2006). For initial estimates, we used a temperature
halfway between what was observed during collection, although this
estimate can be improved by using non-linear averaging to account for
Jenzen’s Inequality and the effect of temperature variation on rate
functions. Changes were examined for each pair of collections (early to
peak, and peak to late).
Shown below is a comparison of the estimated haldane values for CTmax
and body size, separated by season. Keep in mind that while this metric
accounts for differences in the number of generations between
collections, it does not directly account for differences in
temperature, leading to inflated values in the “peak to late”
comparisons, which typically covered a larger range of temperatures.
early_peak = full_data %>%
filter(season %in% c("early", "peak")) %>%
mutate(season = if_else(season == "early", "one", "two")) %>%
group_by(site) %>%
mutate(ctmax_sd_p = sd(ctmax),
size_sd_p = sd(size),
temp_change = max(collection_temp) - min(collection_temp),
avg_temp = (max(collection_temp) + min(collection_temp)) / 2,
days_passed = max(doy) - min(doy)) %>%
select(site, lat, season,
ctmax_sd_p, size_sd_p,
temp_change, avg_temp, days_passed,
ctmax, size) %>%
group_by(site, lat, season,
ctmax_sd_p, size_sd_p,
temp_change, avg_temp, days_passed) %>%
summarize(ctmax = mean(ctmax),
size = mean(size)) %>%
pivot_wider(id_cols = c(site, lat, ctmax_sd_p, size_sd_p,
temp_change, avg_temp, days_passed),
names_from = season,
values_from = c(ctmax, size)) %>%
mutate(season = "early_to_peak") %>%
drop_na()
peak_late = full_data %>%
filter(season %in% c("peak", "late")) %>%
mutate(season = if_else(season == "peak", "one", "two")) %>%
group_by(site) %>%
mutate(ctmax_sd_p = sd(ctmax),
size_sd_p = sd(size),
temp_change = last(collection_temp) - first(collection_temp),
avg_temp = (max(collection_temp) + min(collection_temp)) / 2,
days_passed = max(doy) - min(doy)) %>%
select(site, lat, season, ctmax_sd_p, size_sd_p,
temp_change, avg_temp, days_passed,
ctmax, size) %>%
group_by(site, lat, season, ctmax_sd_p, size_sd_p,
temp_change, avg_temp, days_passed) %>%
summarize(ctmax = mean(ctmax),
size = mean(size)) %>%
pivot_wider(id_cols = c(site, lat, ctmax_sd_p, size_sd_p,
temp_change, avg_temp, days_passed),
names_from = season,
values_from = c(ctmax, size)) %>%
mutate(season = "peak_to_late") %>%
drop_na()
calc_halds = function(x1, x2, sd_p, g){
((x2 / sd_p) - (x1 / sd_p)) / g
}
haldanes = bind_rows(early_peak, peak_late) %>%
mutate("gen_time" = 5490*(avg_temp + 1)^-2.05,
"gens" = floor(days_passed / gen_time),
"ctmax_haldanes" = calc_halds(x2 = ctmax_two, x1 = ctmax_one,
sd_p = ctmax_sd_p, g = gens),
"size_haldanes" = calc_halds(x2 = size_two, x1 = size_one,
sd_p = size_sd_p, g = gens))
# haldanes %>%
# ungroup() %>%
# select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>%
# pivot_longer(cols = c(ctmax_haldanes, size_haldanes),
# names_to = c("type", NA),
# names_sep = "_",
# values_to = "haldanes") %>%
# ggplot(aes(x = type, y = haldanes, group = site, colour = site)) +
# facet_wrap(season~.) +
# geom_hline(yintercept = 0) +
# geom_line(aes(linewidth = desc(temp_change))) +
# scale_colour_manual(values = site_cols) +
# labs(x = "Trait",
# y = "Haldanes",
# linewidth = "Temp. Change") +
# theme_matt_facets()
ctmax_halds_plot = haldanes %>%
ungroup() %>%
select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>%
ggplot(aes(x = season, y = ctmax_haldanes, colour = site, group = site)) +
geom_hline(yintercept = 0, colour = "grey70") +
geom_line(linewidth = 2) +
scale_colour_manual(values = site_cols) +
labs(x = "Season",
y = "Haldanes") +
ggtitle("CTmax") +
theme_matt() +
theme(legend.position = "right")
size_halds_plot = haldanes %>%
ungroup() %>%
select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>%
ggplot(aes(x = season, y = size_haldanes, colour = site, group = site)) +
geom_hline(yintercept = 0, colour = "grey70") +
geom_line(linewidth = 2) +
scale_colour_manual(values = site_cols) +
labs(x = "Season",
y = "Haldanes") +
ggtitle("Size") +
theme_matt() +
theme(legend.position = "right")
ggarrange(ctmax_halds_plot, size_halds_plot, common.legend = T, legend = "bottom")

Why does intraspecific data matter?
Thermal limits vary substantially across both spatial and temporal
scales in this species, highlighting the importance of considering both
intraspecific and temporal variation in thermal limits for predictions
of vulnerability to climate change. Single point estimates of thermal
limits (as commonly used in larger, general analyses across taxa)
obscure this crucial variation, and may bias our estimates of spatial
patterns in vulnerability. Here we explore three separate scenarios to
illustrate and quantify the importance of this intraspecific
vulnerability.
Scenario 1 - Invariant thermal limits
The first scenario assumes that thermal limits are constant across
both spatial and temporal axes (i.e. a single point estimate of the
thermal limit for this species). Here we selected a central population
(the high salinity Chesapeake Bay site), and used the average thermal
limit from the peak season sample as our ‘representative’ thermal limit.
This approach is similar to that used in Bennet et al. to compile the
GlobTherm dataset. These thermal limits are used to re-estimate warming
tolerance for each collection (mean thermal limit - collection
temperature). We then compared this predicted warming tolerance with the
actual observed warming tolerances from each collection. A positive
difference indicates an overestimated warming tolerance (the population
is actually closer to their thermal limits than would be predicted from
the estimated value, and therefore more vulnerable). A negative
difference indicates an underestimated warming tolerance (the population
is further from their thermal limit than would be predicted, and
therefore less vulnerable).
Both overestimates and underestimates can be problematic for accurate
management and conservation strategies. We summarize each of the
scenarios using 1) the number of populations with a difference between
estimates >2°C in either direction, 2) the average magnitude of
difference for that subset of populations, and 3) the slope of the
difference against latitude. Effective estimation strategies will have a
small number of populations with under- or over-estimated warming
tolerance, a small magnitude difference between predicted and observed
warming tolerance, and a shallow latitudinal slope.
In this first scenario (single point estimate of thermal limits), the
effectiveness of the estimate varied across latitude and across seasons.
During the early season, thermal limits from the central site were a
decent predictor of warming tolerance at the other sites, and there was
only a slight latitudinal trend. This latitudinal trend increased,
however, during the peak and late season collections, driven by
increasingly large differences in the northern sites (indicating
increased vulnerability relative to predictions in these sites). During
the peak season collection, warming tolerance in the southern sites was
underestimated by several degrees (these populations were less
vulnerable than predicted by the central site thermal limits).
# Compare estimated warming tolerance "ranges" when: 1) CTmax for "average" collection is used; 2) When CTmax for one collection per population is used; and 3) When all collections are used. The idea is to show that not accounting for intra-specific and intra-population variation leads to incorrect predictions of vulnerability to warming because this variation can be substantial - across populations within each seasonal collection, there is at least 5°C variation in thermal limits, while across collections within populations, acclimation to changes in temperature can drive substantial variation.
## Scenario 1 - single point estimates
est_1 = full_data %>%
group_by(site, season) %>%
summarise("mean_ctmax" = mean(ctmax)) %>%
filter(site == "Tyler Cove", season == "peak")
scenario_1 = full_data %>%
mutate(rep_ctmax = est_1$mean_ctmax,
pred_wt = rep_ctmax - collection_temp,
wt_diff = pred_wt - warming_tol)
ggplot(scenario_1, aes(x = lat, y = wt_diff)) +
facet_wrap(season~., nrow = 3) +
geom_hline(yintercept = 0) +
geom_smooth(method = "lm") +
geom_point() +
labs(x = "Latitude",
y = "Predicted - Observed WT") +
theme_matt_facets()

lat.model1 = lm(data = scenario_1,
wt_diff ~ lat*season)
lat_slope_1 = emmeans::emtrends(lat.model1, var = "lat", specs = "season") %>%
as.data.frame() %>%
select(season, lat.trend)
performance_1 = scenario_1 %>%
select(site, lat, season, wt_diff) %>%
group_by(site, season, lat) %>%
summarise("mean_diff" = mean(wt_diff),
"abs_diff" = abs(mean_diff)) %>%
ungroup() %>%
mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>%
filter(flag == "yes") %>%
group_by(season) %>%
summarise("avg_diff" = mean(abs_diff),
"n" = n()) %>%
inner_join(lat_slope_1, by = "season")
Scenario 2 - Seasonally invariant thermal limits
Local adaptation of thermal limits is widely observed across a range
of taxa, including Acartia tonsa. In the second scenario, we
account for this by using average thermal limits from the peak season
for each population in the estimates of warming tolerance throughout the
year.
Unsurprisingly, this approach eliminates the latitudinal trend.
Instead we see that peak season estimates were generally decent
predictors of warming tolerance during the early season (although there
were slight overestimates in several populations), and slightly
underestimated warming tolerance during the late season.
est_2 = full_data %>%
group_by(site, season) %>%
summarise("mean_ctmax" = mean(ctmax)) %>%
filter(season == "peak") %>%
select(site, mean_ctmax)
scenario_2 = full_data %>%
inner_join(est_2, by = c("site")) %>%
mutate(pred_wt = mean_ctmax - collection_temp,
wt_diff = pred_wt - warming_tol)
ggplot(scenario_2, aes(x = lat, y = wt_diff)) +
facet_wrap(season~., nrow = 3) +
geom_hline(yintercept = 0) +
geom_smooth(method = "lm") +
geom_point() +
labs(x = "Latitude",
y = "Predicted - Observed WT") +
theme_matt_facets()

lat.model2 = lm(data = scenario_2,
wt_diff ~ lat*season)
lat_slope_2 = emmeans::emtrends(lat.model2, var = "lat", specs = "season") %>%
as.data.frame() %>%
select(season, lat.trend)
performance_2 = scenario_2 %>%
select(site, lat, season, wt_diff) %>%
group_by(site, season, lat) %>%
summarise("mean_diff" = mean(wt_diff),
"abs_diff" = abs(mean_diff)) %>%
ungroup() %>%
mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>%
filter(flag == "yes") %>%
group_by(season) %>%
summarise("avg_diff" = mean(abs_diff),
"n" = n()) %>%
inner_join(lat_slope_2, by = c("season"))
Scenario 3 - Population sub-sampling
Both of the previous approaches to estimating warming tolerance
result in overestimates of warming tolerance. These reductive methods
increase the feasibility, but are unable to account for the co-occuring
shifts in ambient temperature and thermal limits. Continuous in-situ
monitoring of thermal limits is impractical, however, especially for
species with small popuation sizes and/or very large range
distributions. One potential compromise solution is to sub-sample
populations and use observed data to predict spatial and seasonal
changes in warming tolerance.
In this third approach, we randomly selected nine collections, fit a
linear model of CTmax ~ collection temperature, and used this regression
to predict thermal limits and warming tolerance across the full set of
collections. These predicted warming tolerance values were then compared
against observed warming tolerance as before. We repeated this process
100 times (100 random sets of 9 collections) to examine the sensitivity
of this approach the populations and seasons collected. In addition to
this random data, we also included a scenario where all seasonal
collections from Ft. Hamer, Tyler Cove, and Miramichi (the latitudinal
extremes and a central point) were used to predict thermal limits.
scenario_3 = data.frame()
performance_3 = data.frame()
for(i in 1:100){
est_3 = full_data %>%
group_by(site, season, collection_temp) %>%
summarise("mean_ctmax" = mean(ctmax), .groups = "keep") %>%
ungroup() %>%
filter(row_number() %in% sample(c(1:max(row_number())), size = 9, replace = F))
rep.model = lm(data = est_3, mean_ctmax ~ collection_temp)
rep_data = full_data %>%
group_by(site, season) %>%
mutate(mean_wt = mean(warming_tol)) %>%
select(site, season, collection_temp, lat, mean_wt) %>%
ungroup() %>%
distinct() %>%
mutate(pred_ctmax = predict(rep.model, newdata = .),
pred_wt = pred_ctmax - collection_temp,
wt_diff = pred_wt - mean_wt,
run = i,
group = "random")
scenario_3 = bind_rows(scenario_3, rep_data)
lat.model3 = lm(data = scenario_3,
wt_diff ~ lat*season)
lat_slope_3 = emmeans::emtrends(lat.model3, var = "lat", specs = "season") %>%
as.data.frame() %>%
select(season, lat.trend)
rep_performance = scenario_3 %>%
select(site, lat, season, wt_diff) %>%
group_by(site, season, lat) %>%
summarise("mean_diff" = mean(wt_diff),
"abs_diff" = abs(mean_diff),
.groups = "keep") %>%
ungroup() %>%
mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>%
filter(flag == "yes") %>%
group_by(season) %>%
summarise("avg_diff" = mean(abs_diff),
"n" = n(),
.groups = "keep") %>%
inner_join(lat_slope_3, by = c("season"))
performance_3 = bind_rows(performance_3, rep_performance)
}
gold_stand = full_data %>%
group_by(site, season, collection_temp) %>%
summarise("mean_ctmax" = mean(ctmax), .groups = "keep") %>%
ungroup() %>%
filter(site %in% c("Ft. Hamer", "Tyler Cove", "Miramichi"))
gold.model = lm(data = gold_stand, mean_ctmax ~ collection_temp)
gold_data = full_data %>%
group_by(site, season) %>%
mutate(mean_wt = mean(warming_tol)) %>%
select(site, season, collection_temp, lat, mean_wt) %>%
ungroup() %>%
distinct() %>%
mutate(pred_ctmax = predict(gold.model, newdata = .),
pred_wt = pred_ctmax - collection_temp,
wt_diff = pred_wt - mean_wt,
run = i + 1,
group = "gold")
gold.model = lm(data = gold_data,
wt_diff ~ lat*season)
gold_slope = emmeans::emtrends(gold.model, var = "lat", specs = "season") %>%
as.data.frame() %>%
select(season, lat.trend)
gold_performance = gold_data %>%
select(site, lat, season, wt_diff) %>%
group_by(site, season, lat) %>%
summarise("mean_diff" = mean(wt_diff),
"abs_diff" = abs(mean_diff),
.groups = "keep") %>%
ungroup() %>%
mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>%
filter(flag == "yes") %>%
group_by(season) %>%
summarise("avg_diff" = mean(abs_diff),
"n" = n(),
.groups = "keep") %>%
inner_join(gold_slope, by = c("season"))
scenario_3 = bind_rows(scenario_3, gold_data)
performance_3_sum = performance_3 %>%
group_by(season) %>%
summarise("avg_diff" = mean(avg_diff),
"n" = mean(n),
"lat.trend" = mean(lat.trend))
ggplot(scenario_3, aes(x = lat, y = wt_diff, colour = group, group = run)) +
facet_wrap(season~., nrow = 3) +
geom_hline(yintercept = 0) +
geom_smooth(aes(colour = group),
method = "lm", se = F) +
geom_point() +
labs(x = "Latitude",
y = "Predicted - Observed WT") +
theme_matt_facets()

knitr::kable(performance_1, caption = "Scenario 1")
Scenario 1
| early |
2.879537 |
1 |
0.0942793 |
| peak |
3.059815 |
3 |
0.2746916 |
| late |
4.059209 |
6 |
0.2516853 |
knitr::kable(performance_2, caption = "Scenario 2")
Scenario 2
| early |
2.208815 |
1 |
-0.1249784 |
| late |
2.692996 |
5 |
-0.0248105 |
knitr::kable(performance_3_sum, caption = "Scenario 3")
Scenario 3
| peak |
3.713519 |
1.00 |
0.0954369 |
| late |
2.155182 |
1.88 |
0.1651261 |
knitr::kable(gold_performance, caption = "`Gold` Standard")
Gold Standard
| early |
2.795142 |
1 |
0.0766049 |
| peak |
4.837180 |
1 |
0.1476920 |
| late |
3.116444 |
3 |
0.1901852 |
best = bind_rows(
mutate(performance_1, "scenario" = "one"),
mutate(performance_2, "scenario" = "two"),
mutate(performance_3_sum, "scenario" = "three"),
mutate(gold_performance, "scenario" = "gold")) %>%
group_by(season) %>%
filter(abs(lat.trend) == min(abs(lat.trend)))
#filter(avg_diff == min(avg_diff))
Next Steps
After phenotyping, each individual was preserved in 95% ethanol.
Individual DNA libraries will be prepared using Twist Bio 96-plex prep
kits, then sequenced on an Illumina NovaSeq X Plus. Using the
low-coverage whole genome sequences, we will examine seasonal patterns
in allele frequency change, and compare these fine scale temporal
patterns with the larger latitudinal patterns in allele frequency to
determine whether the same alleles driving rapid seasonal adaptation are
in play over larger spatial (and longer temporal) scales.
Misc. Details
ggplot(temp_record, aes(x = minute_passed, y = temp_C, group = factor(run))) +
geom_abline(slope = 0.3, intercept = mean(temp_record[temp_record$minute_interval == 0, 8])) +
geom_abline(slope = 0.1, intercept = mean(temp_record[temp_record$minute_interval == 0, 8])) +
geom_line(linewidth = 0.2, alpha = 0.8) +
geom_point(data = full_data,
aes(x = time, y = ctmax + 0.4),
size = 2,
shape = 25) +
labs(x = "Time passed (minutes)",
y = "Temperature (degrees C)",
fill = "Trial Number") +
guides(colour = "none") +
theme_matt(base_size = 16) +
theme(legend.position = "right")

ramp_record2 = ramp_record %>%
group_by(run, minute_interval) %>%
summarise(mean_ramp = mean(ramp_per_minute)) %>%
ungroup()
ggplot(ramp_record2, aes(x = minute_interval, y = mean_ramp)) +
geom_hline(yintercept = 0.3) +
geom_hline(yintercept = 0.1) +
#geom_point() +
geom_hex(bins = 30) +
ylim(0, 0.35) +
labs(y = "Ramp Rate (deg. C / min.)",
x = "Time into run (minute)") +
theme_matt(base_size = 16)

full_data %>%
drop_na(replicate) %>%
ggplot(aes(x = factor(replicate), y = ctmax, group = site)) +
facet_grid(site~season, scales = "free_y") +
geom_point(position = position_jitter(width = 0.1, height = 0),
alpha = 0.4,
colour = "grey30") +
geom_smooth(method = "lm", colour = "black") +
labs(x = "Replicate",
y = "CTmax") +
theme_matt_facets()

ggplot(haldanes, aes(x = lat, y = gens, colour = site, shape = season)) +
geom_hline(yintercept = 0) +
geom_point(size = 5) +
scale_colour_manual(values = site_cols) +
labs(x = "Latitude",
y = "Generations between \ncollections") +
scale_y_continuous(breaks = seq(from = 0, to = 21, by = 5)) +
theme_matt() +
theme(legend.position = "right")

obs_ranks = ggplot(full_data, aes(x = rank)) +
facet_wrap(tube~.) +
geom_histogram(binwidth = 1) +
scale_x_continuous(breaks = c(2,4,6,8,10)) +
ggtitle("Observation") +
theme_matt_facets()
sim_data = data.frame()
for(i in 1:max(full_data$run)){
rep_data = data.frame("tube" = sample(c(1:10), size = 10, replace = F),
"rank" = c(1:10),
"rep" = i) %>%
arrange(tube)
sim_data = bind_rows(sim_data, rep_data)
}
sim_ranks = ggplot(sim_data, aes(x = rank)) +
facet_wrap(tube~.) +
geom_histogram(binwidth = 1) +
scale_x_continuous(breaks = c(2,4,6,8,10)) +
ggtitle("Simulation") +
theme_matt_facets()
ggarrange(obs_ranks, sim_ranks)

---
title: "Comparing seasonal and latitudinal patterns in thermal adaptation"
date: "`r Sys.Date()`"
output: 
  html_document:
          code_folding: hide
          code_download: true
          toc: true
          toc_float: true
  github_document:
          html_preview: false
          toc: true
          toc_depth: 3
---

```{r}
# TO DO 
# - Framework for quantifying the effects of within- and across-population variation in thermal limits to spatial patterns in vulnerability to warming. Comparing predictions based on 1) median, 2) overall CTmax vs. temp regression, 3) population variation in intercepts, 4) population variation in both slope and intercept. The end metric I could use to compare across scenarios is i) the cumulative amount of underestimation (summed across populations) or ii) the number of sites that have overestimated WT, or iii) the slope of WT (local adaptation and seasonal acclimation should result in more shallow slopes). 
```


```{r setup, include=T, message = F, warning = F, echo = F}

knitr::opts_chunk$set(
  echo = knitr::is_html_output(),
  fig.align = "center",
  fig.path = "../Figures/markdown/",
  dev = c("png", "pdf"),
  message = FALSE,
  warning = FALSE,
  collapse = T
)

theme_matt = function(base_size = 18,
                      dark_text = "grey20"){
  mid_text <-  monochromeR::generate_palette(dark_text, "go_lighter", n_colours = 5)[2]
  light_text <-  monochromeR::generate_palette(dark_text, "go_lighter", n_colours = 5)[3]
  
  theme_pubr(base_family="sans") %+replace% 
    theme(
      panel.background  = element_rect(fill="transparent", colour=NA), 
      plot.background = element_rect(fill="transparent", colour=NA), 
      legend.background = element_rect(fill="transparent", colour=NA),
      legend.key = element_rect(fill="transparent", colour=NA),
      text = element_text(colour = mid_text, lineheight = 1.1),
      title = element_text(size = base_size * 1.5,
                           colour = dark_text),
      axis.text = element_text(size = base_size,
                               colour = mid_text),
      axis.title.x = element_text(size = base_size * 1.2,
                                  margin = unit(c(3, 0, 0, 0), "mm")),
      axis.title.y = element_text(size = base_size * 1.2,
                                  margin = unit(c(0, 5, 0, 0), "mm"), 
                                  angle = 90),
      legend.text = element_text(size=base_size * 0.9),
      legend.title = element_text(size = base_size * 0.9, 
                                  face = "bold"),
      plot.margin = margin(0.25, 0.25, 0.25, 0.25,"cm")
    )
}

theme_matt_facets = function(base_size = 18,
                             dark_text = "grey20"){
  mid_text <-  monochromeR::generate_palette(dark_text, "go_lighter", n_colours = 5)[2]
  light_text <-  monochromeR::generate_palette(dark_text, "go_lighter", n_colours = 5)[3]
  
  theme_bw(base_family="sans") %+replace% 
    theme(
      panel.grid = element_blank(),
      panel.background  = element_rect(fill="transparent", colour=NA), 
      plot.background = element_rect(fill="transparent", colour=NA), 
      legend.background = element_rect(fill="transparent", colour=NA),
      legend.key = element_rect(fill="transparent", colour=NA),
      text = element_text(colour = mid_text, lineheight = 1.1),
      strip.text.x = element_text(size = base_size),
      title = element_text(size = base_size * 1.5,
                           colour = dark_text),
      axis.text = element_text(size = base_size,
                               colour = mid_text),
      axis.title.x = element_text(size = base_size * 1.2,
                                  margin = unit(c(3, 0, 0, 0), "mm")),
      axis.title.y = element_text(size = base_size * 1.2,
                                  margin = unit(c(0, 5, 0, 0), "mm"), 
                                  angle = 90),
      legend.text = element_text(size=base_size * 0.9),
      legend.title = element_text(size = base_size * 0.9, 
                                  face = "bold"),
      plot.margin = margin(0.25, 0.25, 0.25, 0.25,"cm")
    )
}

site_cols = c("Key Largo" = "indianred4", 
              "Manatee River" = "coral", 
              "Ft. Hamer" = "coral3",
              "Tyler Cove" = "goldenrod1",
              "Ganey's Wharf" = "darkgoldenrod3", 
              "Esker Point" = "darkseagreen3",
              "Sawyer Park" = "palegreen4", 
              "St. Thomas de Kent Wharf" = "steelblue2",
              "Ritchie Wharf" = "steelblue4")
```

## Site Characteristics

```{r}
site_temps = full_data %>% 
  dplyr::select(site, lat, season, doy, collection_temp, collection_salinity) %>%  
  distinct() %>% 
  filter(doy > 100) 
```

Copepods were collected by surface tow from sites across the Western Atlantic at several times throughout the year. The sites are shown below. Temperatures at the time of collection were measured using a manual thermometer. Across the entire set of collections, temperature ranged from `r min(site_temps$collection_temp)`°C to `r max(site_temps$collection_temp)`°C.

```{r site-chars, fig.width=10, fig.height=6}
coords = site_data %>%
  dplyr::select(site, long, lat) %>%
  distinct()

site_map = map_data("world") %>% 
  filter(region %in% c("USA", "Canada")) %>% 
  ggplot() + 
  geom_polygon(aes(x = long, y = lat, group = group),
               fill = "lightgrey") + 
  coord_map(xlim = c(-85,-60),
            ylim = c(25, 48)) + 
  geom_point(data = coords,
             mapping = aes(x = long, y = lat, colour = site),
             size = 3) +
  scale_colour_manual(values = site_cols) + 
  labs(x = "Longitude", 
       y = "Latitude") + 
  theme_matt(base_size = 16)

site_temp_plot = ggplot(site_temps, aes(x = doy, y = collection_temp, colour = site)) + 
  geom_line(linewidth = 2) + 
  geom_point(size = 5) +
  scale_colour_manual(values = site_cols) + 
  labs(y = "Temperature (°C)",
       x = "Day of the Year") +
  theme_matt() + 
  theme(legend.position = "right")

ggarrange(site_map, site_temp_plot, common.legend = T, legend = "bottom")
```

Collections aimed to obtain copepods near the onset of peak temperatures, after peak temperatures, and then at low temperatures. Regional data is not available for all sites, so here we've pieced together daily temperature values from either local temperature sensors (sites in Florida and the Chesapeake) and high resolution satellite temperature data (Connecticut, Maine, and the Canadian sites). This satellite data comes from the NOAA 1/4° Daily Optimum Interpolation Sea Surface Temperature (OISST). 

These temperature profiles are shown below, with the temperatures measured during the time of collection included for comparison In several cases collection temperature does not match the recorded daily averages, but the temperature records do give a general sense of the timing of seasonal maxima. In general, the first sample from each site fell just after the site reached the warmest period. The exception to that pattern is in Florida, where collections occurred after an extended period of high temperatures. 

```{r continuous-temps, fig.width=8, fig.height=6}
temp_profiles = temp_profiles %>% 
  mutate(region = fct_relevel(region, "Florida", "Chesapeake", "Connecticut",
                              "Maine", "Shediac", "Miramichi"))

site_temps2 = site_temps %>% 
  mutate(region = case_when(
    site == "Manatee River" ~ "Florida",
    site == "Ft. Hamer" ~ "Florida",
    site == "Tyler Cove" ~ "Chesapeake",
    site == "Ganey's Wharf" ~ "Chesapeake",
    site == "Esker Point" ~ "Connecticut",
    site == "Sawyer Park" ~ "Maine",
    site == "St. Thomas de Kent Wharf" ~ "Shediac",
    site == "Ritchie Wharf" ~ "Miramichi"),
    region = fct_relevel(region, "Florida", "Chesapeake", "Connecticut",
                         "Maine", "Shediac", "Miramichi"))

ggplot(temp_profiles, aes(x = doy, y = temp_c)) + 
  facet_wrap(region~.) + 
  geom_point(data = site_temps2,
             aes(x = doy, y = collection_temp, colour = site),
             size = 3) +
  geom_line() + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Day of the Year", 
       y = "Mean Daily Temp. (°C)") + 
  theme_matt_facets() + 
  theme(legend.position = "none")
```


Exact locations for the sites are provided here. 

```{r site-table}
site_data %>%  
  arrange(lat) %>%  
  select("Site" = site, "Region" = region, "Lat" = lat, "Long" = long) %>% 
  knitr::kable(align = "c")
```

Nested within each of the three regions (South, Central, and Northern regions) are pairs of low and high salinity sites:    

```{r sal-table}
data.frame("Region" = c("South", "Central", "North"),
           "Low Salinity" = c("Ft. Hamer", "Ganey's Wharf", "Ritchie Wharf"),
           "High Salinity" = c("Manatee River", "Tyler Cove", "St. Thomas de Kent Wharf")) %>% 
  knitr::kable(align = "c")
```

\ 

There are fairly well-established divergences between high salinity and low salinity populations of *Acartia tonsa*. These sets of geographically proximate but isolated populations provide independent comparisons of the effects of seasonality. Shown here are the collection conditions for these pairs of sites. Temperature was typically similar across the pairs within each collection, while salinity differences were fairly stable across collections. 

```{r season-sal-comps, fig.width=8, fig.height=8}
season_cols = c("early" = "grey75", 
                "peak" = "grey50", 
                "late" = "grey25")

sal_regions = data.frame(region = rep(c("South", "Central", "North"), each = 2), 
                         site = c("Ft. Hamer", "Manatee River", 
                                  "Ganey's Wharf", "Tyler Cove", 
                                  "Ritchie Wharf", "St. Thomas de Kent Wharf"),
                         salinity = c("low", "high"))

sal_comps = full_data %>% 
  filter(site %in% sal_regions$site) %>% 
  inner_join(sal_regions, by = c("site")) %>% 
  select( region = region.y, site, salinity, season, doy, collection_temp, collection_salinity,
          size, ctmax, warming_tol) %>% 
  mutate(salinity = fct_relevel(salinity, "low", "high"),
         region = fct_relevel(region, "South", "Central", "North"))

sal_comp_temps = sal_comps %>%  
  select(salinity, season, region, collection_temp, collection_salinity) %>% 
  distinct() %>% 
  ggplot(aes(x = salinity, y = collection_temp, colour = season, group = season)) + 
  facet_wrap(region~.) + 
  geom_line(linewidth = 1.5) + 
  geom_point(size = 4) + 
  scale_colour_manual(values = season_cols) + 
  labs(y = "Collection Temp. (°C)",
       x = "") + 
  theme_matt_facets(base_size = 14)

sal_comp_sal = sal_comps %>%  
  select(salinity, season, region, collection_temp, collection_salinity) %>% 
  distinct() %>% 
  ggplot(aes(x = salinity, y = collection_salinity, colour = season, group = season)) + 
  facet_wrap(region~.) + 
  geom_line(linewidth = 1.5) + 
  geom_point(size = 4) + 
  scale_colour_manual(values = season_cols) + 
  labs(y = "Collection Salinity (psu)",
       x = "Salinity") + 
  theme_matt_facets(base_size = 14)

ggarrange(sal_comp_temps, sal_comp_sal, nrow = 2, common.legend = T, legend = "right")

# sal_comps %>%  
#   select(site, salinity, season, region, collection_temp, collection_salinity) %>% 
#   distinct() %>% 
#   ggplot(aes(x = collection_salinity, y = collection_temp, colour = site)) + 
#   facet_grid(region~.) + 
#   geom_point(size = 4) + 
#   #stat_ellipse() +
#   #geom_path(arrow = arrow(length = unit(0.1, "inches"), type = "closed")) + 
#   scale_colour_manual(values = site_cols) + 
#   theme_matt_facets(base_size = 14)
```

The latitudinal gradient covers a wide range of seasonality. Shown below is the temperature range. While based on collection temperatures, and therefore an underestimate of the total seasonal range of temperatures, these patterns are representative of the expected latitudinal gradient in seasonality. 

```{r lat-temp-range-plot, fig.width=8, fig.height=5}
site_temps %>% 
  group_by(site, lat) %>%  
  summarise(temp_range = max(collection_temp) - min(collection_temp)) %>%  
  ggplot(aes(x = lat, y = temp_range)) + 
  geom_point(aes(colour = site),
             size = 3) + 
  scale_color_manual(values = site_cols) + 
  labs(x = "Latitude", 
       y = "Collection Temp. Range (°C)") + 
  theme_matt() + 
  theme(legend.position = "right")
```


## Phenotypic Measurements 

### Critical Thermal Limits

A total of `r dim(all_data)[1]` individuals were examined. Critical thermal limits and body size measurements were made before individuals were preserved in ethanol. We excluded data for `r dim(excluded)[1]` individuals, detailed below. These individuals had either very low CTmax or were, upon re-examination of photographs, identified as juveniles instead of mature females. With these individuals excluded, **the full data set contains `r dim(full_data)[1]` phenotyped individuals**.   

```{r excluded-inds}
excluded %>% 
  select(region, site, season, collection_temp, collection_salinity, replicate, tube, ctmax, size) %>% 
  knitr::kable(align = "c")
```

Critical thermal maxima (CTmax) was measured using a custom setup. The method uses a standard dynamic ramping assay to determine the maximum temperature individuals could sustain normal functioning. This differs from lethal temperatures, and indeed, all individuals observed so far recovered following the assay.

Individuals were rested for one hour after collection before the assay. During the assay, copepods were held in artificial seawater, composed of bottled spring water and Instant Ocean salt mix adjusted to match collection salinities. During the assay, several 'control' individuals were maintained in this solution at ambient temperatures without the temperature ramp to ensure that there was no background mortality. When sorting individuals from the plankton tow contents, they were held in a 50:50 mix of 60 um filtered water from the collection site and artificial seawater as an additional acclimation step. 

Sample sizes varied slightly across experiments, but most sites had 20 individuals measured per season. The major exceptions were the early samples from the Florida sites and the late sample from Sawyer Park (Maine). Only two sets of samples (peak and late) were collected from Fort Hamer and Manatee River. No samples were collected from Key Largo for this project, as *Acartia tonsa* wasn't present in the water during the peak season, likely due to the recent extreme heat event. The late season collection from Sawyer Park occurred after *Acartia tonsa* abundance decreased. Samples from this period were dominated by *Acartia hudsonica* instead. 

```{r sample-size-plot, fig.width=12, fig.height=5}
ggplot(full_data, aes(x = site, fill = site)) + 
  facet_wrap(season~.) + 
  geom_hline(yintercept = c(0,20),
             colour = "grey70") + 
  geom_bar() + 
  scale_fill_manual(values = site_cols) + 
  coord_flip() +
  theme_matt() + 
  theme(legend.position = "none",
        panel.border = element_rect(linewidth = 1,
                                    fill = NA),
        strip.text = element_text(size = 20),
        axis.title.y = element_blank())
```

Shown below are the measured CTmax values. Note: CTmax values for the early season Key Largo copepods were collected at the end of February 2023 as part of a separate project. Body size values were not measured during this project, nor were copepods individually preserved after the experiments. These early season CTmax values are included as a point of comparison. Individual measurements are shown in small points for each collection. The large points indicate the mean values for each collection. 

```{r seasonal-ct-max}
mean_ctmax = full_data %>% 
  group_by(site, season, doy, collection_temp) %>% 
  summarize(mean_ctmax = mean(ctmax),
            median_ctmax = median(ctmax))

ggplot(full_data, aes(x = season, y = ctmax, colour = site)) + 
  geom_line(data = mean_ctmax, 
            aes(y = mean_ctmax, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 1) + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.3) + 
  geom_point(data = mean_ctmax, 
             aes(y = mean_ctmax),
             position = position_dodge(width = 0.4),
             size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax (°C)",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)
```

```{r doy-ct-max, include = F}
# The same data is shown below, plotted against day of the year instead of season. This accounts for the variable timing of collections across regions (e.g. - the compressed collections from the Northern sites to accomodate the earlier onset of cold temperatures). 

ggplot(filter(full_data, site != "Key Largo"), aes(x = doy, y = ctmax, colour = site)) + 
  geom_line(data = filter(mean_ctmax, site != "Key Largo"), 
            aes(y = median_ctmax, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 1) + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.3) + 
  geom_point(data = filter(mean_ctmax, site != "Key Largo"), 
             aes(y = median_ctmax),
             position = position_dodge(width = 0.4),
             size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax (°C)",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)
```

CTmax data for each individual site is shown below, plotted against day of the year. 

```{r ctmax-ind-pops-doy, fig.width=8, fig.height=6}
ggplot(full_data, aes(x = doy, y = ctmax, colour = site)) + 
  facet_wrap(.~site, scales = "free") + 
  geom_line(data = mean_ctmax, 
            aes(y = mean_ctmax, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 3, alpha = 0.5) + 
  # geom_line(data = mean_ctmax, 
  #           aes(y = collection_temp, group = site),
  #           position = position_dodge(width = 0.4),
  #           linewidth = 2,
  #           colour = "grey") + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.8) + 
  # geom_point(data = mean_ctmax, 
  #            aes(y = median_ctmax),
  #            position = position_dodge(width = 0.4),
  #            size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax (°C)",
       x = "Day of Year") +
  theme_matt() + 
  theme(legend.position = "none", 
        legend.title.align = 0.125)
```

```{r ctmax-ind-pops-season, fig.width=8, fig.height=6, include = F}
ggplot(full_data, aes(x = season, y = ctmax, colour = site)) + 
  facet_wrap(.~site, scales = "free_y") + 
  geom_line(data = mean_ctmax, 
            aes(y = median_ctmax, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 3, alpha = 0.5) + 
  geom_line(data = mean_ctmax, 
            aes(y = collection_temp, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 2,
            colour = "grey") + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.8) + 
  # geom_point(data = mean_ctmax, 
  #            aes(y = median_ctmax),
  #            position = position_dodge(width = 0.4),
  #            size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax (°C)",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "none", 
        legend.title.align = 0.125)
```

### Warming tolerance

Warming tolerance (the difference between thermal limits and environmental temperatures) is a commonly used metric of climate vulnerability. We calculated this as the difference between measured CTmax values and the collection temperature. Smaller warming tolerance values indicate that populations were nearer to their upper thermal limits, and may therefore be more vulnerable to additional warming. 

```{r seasonal-warming-tol}
mean_wt = full_data %>% 
  group_by(site, season) %>% 
  summarize(mean_wt = mean(warming_tol),
            median_wt = median(warming_tol))

ggplot(full_data, aes(x = season, y = warming_tol, colour = site)) + 
  geom_line(data = mean_wt, 
            aes(y = mean_wt, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 1) + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.3) + 
  geom_point(data = mean_wt, 
             aes(y = mean_wt),
             position = position_dodge(width = 0.4),
             size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Warming Tolerance (°C)",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)
```

### Body Size

Following the CTmax assay, individuals were photographed for body size measurements. Prosome lengths were measured from these photographs using a scale micrometer and the software ImageJ. These measurements are shown below. As before, large points indicate the mean body size. While less cohesive than CTmax, a general trend of increasing body size with latitude and time of year can be seen. 

```{r seasonal-body-size}
mean_size = full_data %>% 
  group_by(site, season, doy, collection_temp) %>% 
  summarize(mean_size = mean(size),
            median_size = median(size))

ggplot(full_data, aes(x = season, y = size, colour = site)) + 
  geom_line(data = mean_size, 
            aes(y = mean_size, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 1) + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.3) + 
  geom_point(data = mean_size, 
             aes(y = mean_size),
             position = position_dodge(width = 0.4),
             size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Prosome Length (mm)",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)
```

```{r doy-body-size, include = F}
ggplot(drop_na(full_data, size), aes(x = doy, y = size, colour = site)) + 
  geom_line(data = drop_na(mean_size, mean_size), 
            aes(y = median_size, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 1) + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.3) + 
  geom_point(data = drop_na(mean_size, mean_size), 
             aes(y = median_size),
             position = position_dodge(width = 0.4),
             size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Prosome Length (mm)",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)
```

Shown below is the body size data for each individual site. 

```{r size-ind-pops-doy, fig.width=8, fig.height=6}
ggplot(drop_na(full_data, size), aes(x = doy, y = size, colour = site)) + 
  facet_wrap(.~site) + 
  geom_line(data = drop_na(mean_size, mean_size), 
            aes(y = mean_size, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 3, alpha = 0.5) + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.8) + 
  # geom_point(data = mean_ctmax, 
  #            aes(y = median_ctmax),
  #            position = position_dodge(width = 0.4),
  #            size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Prosome Length (mm)",
       x = "Day of Year") +
  theme_matt() + 
  theme(legend.position = "none", 
        legend.title.align = 0.125)
```

```{r size-ind-pops-season, fig.width=8, fig.height=6, include = F}
ggplot(full_data, aes(x = season, y = size, colour = site)) + 
  facet_wrap(.~site) + 
  geom_line(data = mean_size, 
            aes(y = median_size, group = site),
            position = position_dodge(width = 0.4),
            linewidth = 3, alpha = 0.5) + 
  geom_point(position = position_jitterdodge(jitter.width = 0.1, jitter.height = 0,
                                             dodge.width = 0.4),
             alpha = 0.8) + 
  # geom_point(data = mean_ctmax, 
  #            aes(y = median_ctmax),
  #            position = position_dodge(width = 0.4),
  #            size = 4) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Prosome Length (mm)",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "none", 
        legend.title.align = 0.125)
```

### Salinity Pair Comparisons 

The three pairs of cross-salinity comparisons do show evidence for fine-scale trait divergence, although there was no consistent pattern in the direction or magnitude of differences. CTmax was similar across sites in the Southern and Central pairs. In the Northern pair, CTmax tended to be slightly lower for individuals from the low salinity site. Size was more variable between the paired sites. In the South, low salinity individuals were consistently smaller than high salinity individuals, despite the similar temperatures. In the Central pair, individuals from the low salinity site tended to be slightly larger than those from the high salinity site, although this varied seasonally. Sizes tended to be more similar across the collections from the Northern pair. 

```{r sal-pair-traits}
sal_comp_ctmax_plot = sal_comps %>% 
  ggplot(aes(x = salinity, y = ctmax, colour = season, group = season)) + 
  facet_wrap(region~.) + 
  geom_point(size = 2,
             position = position_dodge(width = 0.2)) + 
  #geom_line(size = 1.5) + 
  scale_colour_manual(values = season_cols) + 
  labs(y = "CTmax (°C)",
       x = "") + 
  theme_matt_facets(base_size = 14)

sal_comp_size_plot = sal_comps %>% 
  ggplot(aes(x = salinity, y = size, colour = season, group = season)) + 
  facet_wrap(region~.) + 
  geom_point(size = 2, 
             position = position_dodge(width = 0.2)) + 
  #geom_line(size = 1.5) + 
  scale_colour_manual(values = season_cols) + 
  labs(y = "Prosome Length (mm)",
       x = "") + 
  theme_matt_facets(base_size = 14)

ggarrange(sal_comp_ctmax_plot, sal_comp_size_plot, nrow = 2, common.legend = T, legend = "right")

###

sal_comp_ctmax.model = lm(ctmax ~ collection_temp, data = sal_comps)
# summary(ctmax_temp.model)
# car::Anova(ctmax_temp.model)
sal_comp_ctmax_resids = residuals(sal_comp_ctmax.model)

sal_comp_size.model = lm(size ~ collection_temp, data = sal_comps)
# summary(size_temp.model)
# car::Anova(size_temp.model)
sal_comp_size_resids = residuals(sal_comp_size.model)

sal_comp_ctmax_resid_plot = sal_comps %>%
  mutate(ctmax_resids = sal_comp_ctmax_resids,
         size_resids = sal_comp_size_resids) %>%
  ggplot(aes(x = salinity, y = ctmax_resids, colour = season, group = season)) +
  facet_wrap(region~.) +
  geom_point(size = 2,
             position = position_dodge(width = 0.5)) +
  #geom_line(size = 1.5) +
  scale_colour_manual(values = season_cols) +
  labs(y = "CTmax \nResiduals",
       x = "") +
  theme_matt_facets(base_size = 14)

sal_comp_size_resid_plot = sal_comps %>%
  mutate(ctmax_resids = sal_comp_ctmax_resids,
         size_resids = sal_comp_size_resids) %>%
  ggplot(aes(x = salinity, y = size_resids, colour = season, group = season)) +
  facet_wrap(region~.) +
  geom_point(size = 2,
             position = position_dodge(width = 0.5)) +
  #geom_line(size = 1.5) +
  scale_colour_manual(values = season_cols) +
  labs(y = "Prosome Length \nResiduals",
       x = "") +
  theme_matt_facets(base_size = 14)

#ggarrange(sal_comp_ctmax_resid_plot, sal_comp_size_resid_plot, nrow = 2, common.legend = T, legend = "right")
```

## Trait Correlations

Regardless of the underlying mechanism (genetic differentiation or phenotypic plasticity), we expect that collections from warmer waters should yield copepods with higher thermal limits and smaller body sizes. Our observations largely fit this expectation, with strong increases in CTmax at higher temperatures, and a general decrease in prosome lengths as temperature increased. 

```{r temp-cors, fig.width=15, fig.height=6}
ctmax_temp_plot = ggplot(full_data, aes(x = collection_temp, y = ctmax)) + 
  geom_smooth(method = "lm", se = T,
              linewidth = 2, 
              colour = "grey") + 
  geom_point(aes(colour = site), 
             size = 2, alpha = 0.7) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax (°C)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "none")

size_temp_plot = ggplot(full_data, aes(x = collection_temp, y = size)) + 
  geom_smooth(method = "lm", se = T,
              linewidth = 2, 
              colour = "grey") + 
  geom_point(aes(colour = site), 
             size = 2, alpha = 0.7) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Prosome Length (mm)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "right")

wt_temp_plot = ggplot(full_data, aes(x = collection_temp, y = warming_tol)) + 
  geom_smooth(method = "lm", se = T,
              linewidth = 2, 
              colour = "grey") + 
  geom_point(aes(colour = site), 
             size = 2, alpha = 0.7) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Warming Tolerance (°C)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "right")

ggarrange(ctmax_temp_plot, wt_temp_plot, size_temp_plot, common.legend = T, legend = "bottom", nrow = 1)
```

Shown below are these temperature correlations for each individual population. Variation in the temperature sensitivity of these traits appears to vary across populations, with reduced slopes in both the lowest and the highest latitude populations. Again, we emphasize that this observed trait variation may stem from either (or both) plastic and genetic effects. However, these observations provide estimates for realistic patterns in temperature sensitivity for these populations. 

```{r pop-temp-cors, fig.width=8, fig.height=6}
ggplot(full_data, aes(x = collection_temp, y = ctmax)) + 
  facet_wrap(.~site) + 
  geom_smooth(method = "lm", se = T,
              linewidth = 2, 
              colour = "grey") + 
  geom_point(aes(colour = site), 
             size = 2, alpha = 0.7) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax (°C)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "none")

ggplot(full_data, aes(x = collection_temp, y = size)) + 
  facet_wrap(.~site) + 
  geom_smooth(method = "lm", se = T,
              linewidth = 2, 
              colour = "grey") + 
  geom_point(aes(colour = site), 
             size = 2, alpha = 0.7) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Prosome Length (mm)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "none")

```

One additional correlation of interest is the relationship between prosome length and CTmax. In many cases, larger body sizes are associated with cold adaptation/acclimation, and there is a general trend of decreasing thermal limits with increasing size. Shown below is the relationship between prosome length and CTmax in our data set. Individual regression lines for each site are also included - the dark grey lines in the background represent the 'universal' regression for that site, with individual colored regression lines for each collection. Across our collections, we see evidence for this relationship, with larger individuals having lower thermal limits.      

```{r ctmax-vs-size, fig.width=6, fig.height=10}
universal_size = full_data %>% 
  ggplot(aes(x = size, y = ctmax)) + 
  # geom_smooth(data = filter(full_data, ctmax > 31), 
  #             aes(x = size, y = ctmax),
  #             method = "lm", 
  #             colour = "grey60", 
  #             se = F,
  #             linewidth = 2) + 
  geom_smooth(method = "lm", se = T,
              linewidth = 2,
              colour = "grey70") + 
  geom_point(aes(colour = site),
             size = 2, alpha = 0.7) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax (°C)",
       x = "") +
  theme_matt(base_size = 14) + 
  theme(legend.position = "right",
        axis.title.x = element_blank())

pop_size = full_data %>% 
  ggplot(aes(x = size, y = ctmax, colour = site, group = season)) + 
  facet_wrap(site~.) + 
  # geom_smooth(data = filter(full_data, ctmax > 31), 
  #             aes(x = size, y = ctmax),
  #             method = "lm", 
  #             colour = "grey60", 
  #             se = F,
  #             linewidth = 2) + 
  geom_smooth(data = full_data, 
              aes(x = size, y = ctmax, group = site), 
              colour = "grey20", method = "lm", se = F) + 
  geom_point(size = 1.3, alpha = 0.3) + 
  geom_smooth(method = "lm", se = F,
              linewidth = 1) + 
  scale_colour_manual(values = site_cols) + 
  scale_x_continuous(breaks = c(0.6, 0.8, 1)) + 
  labs(y = "CTmax (°C)",
       x = "Prosome Length (mm)") +
  theme_matt(base_size = 14) + 
  theme(legend.position = "right")

ggarrange(universal_size, pop_size, common.legend = T, legend = "none", nrow = 2)
```

This relationship may be affected by changes in temperature at each site, however, which may affect both body size and thermal limits. If there is a true mechanistic relationship between body size and thermal limits, we would expect to see this relationship emerge **within** populations or even individual collections. Shown below is the relationship between CTmax and size residuals, acquired from regressions of these traits against collection temperature. This substantially reduces the strength of the apparent relationship, but there is still a slightly negative overall relationship, spanning both across-population, within-population, and even within-collection scales (see the Sawyer Park collections, for example).     

```{r ctmax-vs-size-resids, fig.width=6, fig.height=10}
filtered_data = full_data %>% 
  drop_na(size, ctmax) %>% 
  mutate(temp_cent = scale(collection_temp, scale = F),
         sal_cent = scale(collection_salinity, scale = F),
         sal_type = if_else(collection_salinity > 20, "High", "Low"))

ctmax_temp.model = lm(ctmax ~ collection_temp + site, data = filtered_data)
ctmax_resids = residuals(ctmax_temp.model)

size_temp.model = lm(size ~ collection_temp + site, data = filtered_data)
size_resids = residuals(size_temp.model)

universal_resids = filtered_data %>% 
  mutate(ctmax_resids = ctmax_resids,
         size_resids = size_resids) 

all_resids = ggplot(universal_resids, aes(x = size_resids, y = ctmax_resids)) + 
  # geom_smooth(data = filter(full_data, ctmax > 31), 
  #             aes(x = size, y = ctmax),
  #             method = "lm", 
  #             colour = "grey60", 
  #             se = F,
  #             linewidth = 2) + 
  geom_smooth(method = "lm", se = T,
              linewidth = 2,
              colour = "grey70") + 
  geom_point(aes(colour = site),
             size = 2, alpha = 0.7) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Residuals",
       x = "") +
  theme_matt(base_size = 14) + 
  theme(legend.position = "right",
        axis.title.x = element_blank())

pop_resids = ggplot(universal_resids, aes(x = size_resids, y = ctmax_resids, colour = site, group = season)) + 
  facet_wrap(site~.) + 
  # geom_smooth(data = filter(full_data, ctmax > 31), 
  #             aes(x = size, y = ctmax),
  #             method = "lm", 
  #             colour = "grey60", 
  #             se = F,
  #             linewidth = 2) + 
  geom_smooth(aes(x = size_resids, y = ctmax_resids, group = site), 
              colour = "grey20", method = "lm", se = F) + 
  geom_point(size = 1.3, alpha = 0.3) + 
  geom_smooth(method = "lm", se = F,
              linewidth = 1) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Residuals",
       x = "Prosome Length Residuals") +
  theme_matt(base_size = 14) + 
  theme(legend.position = "right")

ggarrange(all_resids, pop_resids, common.legend = T, legend = "none", nrow = 2)
```

```{r ctmax-model, include = F}
# 
# full.model = lm(data = filtered_data, 
#                 ctmax ~ site * collection_temp * size, 
#                    na.action = "na.fail")
# 
# dredge_results = MuMIn::dredge(full.model)
# top_model = MuMIn::get.models(dredge_results, 1)[[1]] #Best model
# 
# temp_vals = as_tibble(emtrends(top_model, spec = "site", var = "collection_temp")) 
# size_vals = as_tibble(emtrends(top_model, spec = "site", var = "size")) 

ctmax.model = lme4::lmer(
  data = filtered_data, 
  ctmax ~ temp_cent + size + sal_type + (1 + temp_cent|site))
```

To more formally test the relationships between CTmax, collection temperature, and size, we used a linear mixed effects model, structured as `ctmax ~ collection_temp + size + salinity_type + (1|site)`. This examines the effects of temperature and size on CTmax, along with differences between the salinity groupings. Collection temperature was centered and salinity type assigned ("low" salinity as anything below 20 psu, "high" salinity as anything above 20 psu) before model fitting. The model also includes random intercepts for each site and random slopes for collection temperature (i.e. - variation in the acclimation capacity of CTmax). 

Collection temperature and body size both had a significant effect on CTmax, but salinity type did not. The overall effect of temperature suggests an increase in CTmax of `r round(unname(fixef(ctmax.model)["temp_cent"]), digits = 2)`°C per °C increase in collection temperature (i.e. - an ARR value of `r round(unname(fixef(ctmax.model)["temp_cent"]), digits = 2)`), while increasing body sizes decrease CTmax by `r round(unname(fixef(ctmax.model)["size"]), digits = 2)`°C per mm (or a decrease of ~`r round(unname(fixef(ctmax.model)["size"]), digits = 2)/10`°C per tenth of a mm, which is more biologically realistic for *A. tonsa*). While not significant, the model suggests low salinity sites had lower thermal limits by ~`r abs(round(unname(fixef(ctmax.model)["sal_typeLow"]), digits = 1))`°C.

```{r}

#summary(ctmax.model)

effects_summary = data.frame(
  "Temperature" = unname(fixef(ctmax.model)["temp_cent"]),
  "Size" = unname(fixef(ctmax.model)["size"]),
  "Salinity" = unname(fixef(ctmax.model)["sal_typeLow"]))

knitr::kable(effects_summary)
```

By extracting the conditional mode for the random effects, we can also examine how thermal limits vary across sites beyond the influence of collection temperatures and body sizes. Shown below are these values, extracted from the linear mixed effects model. We can see that, similar to what's been observed in common garden experiments with *A. tonsa* previously, significant divergences are present at only a few sites, with Fort Hamer and Ritchie Wharf having increased and decreased thermal limits respectively. Interestingly, both of these sites were low salinity sites, also in line with previous results suggesting gene flow between high salinity sites may constrain differentiation. 

```{r pop-effs-plot, fig.width=9, fig.height=6}
pop_effs = REsim(ctmax.model) %>% 
  dplyr::select("site" = groupID, term, mean, sd) %>% 
  filter(term == "(Intercept)") %>% 
  inner_join(site_data, by = c("site")) %>% 
  mutate(site = fct_reorder(site, lat))

#plotREsim(REsim(ctmax.model))  # plot the interval estimates

ggplot(pop_effs, aes(x = lat, y = mean, colour = site)) + 
  geom_hline(yintercept = 0) +
  geom_errorbar(aes(ymin = mean - 1.96 * sd, ymax = mean + 1.96 * sd),
                width = 0.5, linewidth = 1) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Latitude", 
       y = "Population Effect") + 
  theme_matt() + 
  theme(legend.position = "right")
```

Finally, shown below are the estimated random slopes for each site. These represent the effects of collection temperature on CTmax for each site. Interestingly, these estimates diverge from the results of previous common garden experiments, which showed the strongest plasticity in high latitude sites. Here, acclimation appears to peak in mid-latitudes, and decrease at both high and low latitude sites. 

```{r site-arr-plot, fig.width=6, fig.height=4}
coefficients(ctmax.model)$site %>%
  janitor::clean_names() %>%
  rownames_to_column(var = "site") %>%
  inner_join(site_data) %>% 
  mutate(site = fct_reorder(site, lat)) %>% 
  ggplot(aes(x = temp_cent, y = site)) +
  geom_point(aes(colour = site),
             size = 5) +
  scale_colour_manual(values = site_cols) +
  labs(x = "ARR") + 
  theme_matt() +
  theme(legend.position = "none",
        axis.title.y = element_blank())
```

## Trait Variability

Shown below is the trait variation (ranges) for each site. Ranges are calculated for each collection separately. 

```{r trait-range-plot, fig.width=12, fig.height=4.5}
trait_ranges = full_data %>% 
  group_by(site, season, collection_temp, collection_salinity, doy, lat) %>% 
  summarise(mean_ctmax = mean(ctmax),
            ctmax_range = max(ctmax) - min(ctmax),
            ctmax_var = var(ctmax),
            mean_size = mean(size),
            size_range = max(size) - min(size),
            size_var = var(size)) %>% 
  mutate(prop_ctmax_range = ctmax_range / mean_ctmax,
         prop_size_range = size_range / mean_size)

ctmax_range_temp = ggplot(trait_ranges, aes(x = collection_temp, y = ctmax_range, colour = site)) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Range (°C)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "right")

ctmax_var_temp = ggplot(trait_ranges, aes(x = collection_temp, y = ctmax_var, colour = site)) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Range (°C)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "right")

size_range_temp = ggplot(trait_ranges, aes(x = collection_temp, y = size_range, colour = site)) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Size Range (mm)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "right")

size_var_temp = ggplot(trait_ranges, aes(x = collection_temp, y = size_var, colour = site)) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "Size Range (mm)",
       x = "Collection Temp. (°C)") +
  theme_matt() + 
  theme(legend.position = "right")

ggarrange(ctmax_range_temp, size_range_temp, common.legend = T, legend = "right")
```

Changes in trait variance may be indicative of phenotypic selection. If selection (as opposed to acclimation) are driving seasonal changes, we may expect to see a reduction in variance in the peak samples relative to the early season samples. Note that early season collection temperatures this year were higher than expected, driven by fairly strong heatwaves across the North Atlantic. As shown in the temperature profiles for each site, the 'early' samples were collected just after high temperatures were reached, while 'peak' samples were collected after sites had experienced high temperatures for several weeks (generations). As warming tolerances were fairly high throughout this period, we will assume that selection was weak before the early samples. If the early onset of high temperatures filtered out vulnerable genotypes prior to our sampling, the results will be a conservative estimate of the effects of selection on trait variance.     

Shown below is the seasonal progression of variance in CTmax for each site. For many sites, variance decreased between the early and peak samples, and then increased again in the late sample. For some sites (e.g. Esker Point), this increase in the late sample was substantial. 

```{r season-var}
ggplot(trait_ranges, aes(x = season, y = ctmax_var, colour = site)) + 
  geom_line(aes(group = site), 
            linewidth = 1.5) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Variance",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)
```

Shown below is the seasonal progression of variance in body size. A similar pattern of decreasing variance in peak samples relative to early and late samples is again seen for many sites. The obvious exception is the Esker Point sample, which saw the opposite trend. 

```{r}
ggplot(trait_ranges, aes(x = season, y = size_var, colour = site)) + 
  geom_line(aes(group = site), 
            linewidth = 1.5) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Variance",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)
```

Shown below are the seasonal changes in trait variance for each site individually. 

```{r var-ind-pops-season, fig.width=8, fig.height=6}
ggplot(trait_ranges, aes(x = season, y = ctmax_var, colour = site)) + 
  facet_wrap(site~.) + 
  geom_line(aes(group = site), 
            linewidth = 1.5) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Variance",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "none", 
        legend.title.align = 0.125)

ggplot(trait_ranges, aes(x = season, y = size_var, colour = site)) + 
  facet_wrap(site~.) + 
  geom_line(aes(group = site), 
            linewidth = 1.5) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(y = "CTmax Variance",
       x = "Season") +
  theme_matt() + 
  theme(legend.position = "none", 
        legend.title.align = 0.125)
```

```{r var-change-temp-change, include = F}
var_change_data = trait_ranges %>%  
  ungroup() %>% 
  mutate(mean_wt = mean_ctmax - collection_temp) %>% 
  group_by(site) %>% 
  arrange(site, doy) %>%  
  mutate(temp_change = collection_temp - lag(collection_temp),
         ctmax_change = mean_ctmax - lag(mean_ctmax),
         wt_change = mean_wt - lag(mean_wt),
         var_change = ctmax_var - lag(ctmax_var)) %>%  
  select(site, season, doy, lat, temp_change, var_change, ctmax_change, wt_change)

ggplot(var_change_data, aes(x = temp_change, y = var_change)) +
  geom_hline(yintercept = 0) + 
  geom_vline(xintercept = 0) +
  geom_smooth(method = "lm") +
  geom_point(aes(colour = site),
             size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Temperature Change (°C)",
       y = "Change in CTmax Variance") + 
  theme_matt() + 
  theme(legend.position = "right", 
        legend.title.align = 0.125)

var_change_data %>% 
  mutate(sample_arr = ctmax_change/temp_change) %>% 
  select(site, season, temp_change, sample_arr) %>% 
  drop_na() %>% 
  ggplot(aes(x = temp_change, y = sample_arr)) + 
  geom_point()

var_change_data %>% 
  mutate(sample_arr = ctmax_change/temp_change) %>% 
  select(site, season, temp_change, sample_arr) %>% 
  drop_na() %>% 
  ggplot(aes(x = sample_arr)) + 
  geom_histogram(binwidth = 0.1)

```

## Comparing rates of change
Both CTmax and body size varied between sites and across seasons. It can be difficult to directly compare these two traits. We take two approaches to ease this comparison. 
Shown below is a comparison of the slopes from the trait regressions against collection temperature for each population, standardized by the standard deviation of the trait for each population (across all collections). This presents change per degree change in collection temperature in units of standard deviations for both CTmax and body size.

```{r adj-slope-comp, fig.width=7, fig.height=6}
adj_slopes = full_data %>% 
  group_by(site, lat) %>% 
  arrange(doy) %>%  
  filter(site != "Key Largo") %>%
  summarize("ctmax_slope" = coef(lm(ctmax ~ collection_temp))["collection_temp"], 
            "mean_ctmax" = mean(ctmax),
            "ctmax_sd" = sd(ctmax),
            "size_slope" = coef(lm(size ~ collection_temp))["collection_temp"], 
            "mean_size" = mean(size),
            "size_sd" = sd(size), 
            "temp_range" = max(collection_temp) - min(collection_temp)) %>%  
  drop_na() %>% 
  mutate(adj_ctmax_slope = ctmax_slope / ctmax_sd,
         adj_size_slope = size_slope / size_sd) %>% 
  pivot_longer(cols = contains("_slope"), 
               names_to = "slope_type",
               values_to = "slope")

# ggplot(adj_slopes, aes(x = lat, y = temp_range)) + 
#   geom_point() + 
#   theme_matt()

ggplot(filter(adj_slopes, str_detect(slope_type, "adj_")), aes(x = slope_type, y = abs(slope), 
                                                               group = site, colour = site)) + 
  geom_hline(yintercept = 0) + 
  geom_line(linewidth = 1) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "", 
       y = "Slope (absolute value)") + 
  theme_matt() + 
  theme(legend.position = "right",
        axis.text.x = element_text(angle = 300, hjust = 0, vjust = 0.5))
```

Haldanes are a similar unit, representing change in units of standard deviations per generation. This can be a useful metric for comparing across traits, especially as the number of generations covered by our sampling period likely varies across populations. The calculation of haldanes is taken from Hendry and Kinnison (1999), which in turn is based on work from Gingerich (1993). We estimated the number of generations passed between collections using the empirical relationship between temperature and development time for *Acartia tonsa* from Leandro et al. (2006). For initial estimates, we used a temperature halfway between what was observed during collection, although this estimate can be improved by using non-linear averaging to account for Jenzen's Inequality and the effect of temperature variation on rate functions. Changes were examined for each pair of collections (early to peak, and peak to late).    

Shown below is a comparison of the estimated haldane values for CTmax and body size, separated by season. Keep in mind that while this metric accounts for differences in the number of generations between collections, it does not directly account for differences in temperature, leading to inflated values in the "peak to late" comparisons, which typically covered a larger range of temperatures. 

```{r haldane-comp-plot, fig.height=6, fig.width=12}
early_peak = full_data %>% 
  filter(season %in% c("early", "peak")) %>% 
  mutate(season = if_else(season == "early", "one", "two")) %>% 
  group_by(site) %>% 
  mutate(ctmax_sd_p = sd(ctmax),
         size_sd_p = sd(size), 
         temp_change = max(collection_temp) - min(collection_temp),
         avg_temp = (max(collection_temp) + min(collection_temp)) / 2,
         days_passed = max(doy) - min(doy)) %>% 
  select(site, lat, season, 
         ctmax_sd_p, size_sd_p, 
         temp_change, avg_temp, days_passed, 
         ctmax, size) %>%
  group_by(site, lat, season, 
           ctmax_sd_p, size_sd_p, 
           temp_change, avg_temp, days_passed) %>% 
  summarize(ctmax = mean(ctmax),
            size = mean(size)) %>% 
  pivot_wider(id_cols = c(site, lat, ctmax_sd_p, size_sd_p, 
                          temp_change, avg_temp, days_passed), 
              names_from = season, 
              values_from = c(ctmax, size)) %>% 
  mutate(season = "early_to_peak") %>%  
  drop_na()

peak_late = full_data %>% 
  filter(season %in% c("peak", "late")) %>% 
  mutate(season = if_else(season == "peak", "one", "two")) %>% 
  group_by(site) %>% 
  mutate(ctmax_sd_p = sd(ctmax),
         size_sd_p = sd(size), 
         temp_change = last(collection_temp) - first(collection_temp),
         avg_temp = (max(collection_temp) + min(collection_temp)) / 2,
         days_passed = max(doy) - min(doy)) %>% 
  select(site, lat, season, ctmax_sd_p, size_sd_p, 
         temp_change, avg_temp, days_passed, 
         ctmax, size) %>%
  group_by(site, lat, season, ctmax_sd_p, size_sd_p, 
           temp_change, avg_temp, days_passed) %>% 
  summarize(ctmax = mean(ctmax),
            size = mean(size)) %>% 
  pivot_wider(id_cols = c(site, lat, ctmax_sd_p, size_sd_p, 
                          temp_change, avg_temp, days_passed), 
              names_from = season, 
              values_from = c(ctmax, size)) %>% 
  mutate(season = "peak_to_late") %>%  
  drop_na()

calc_halds = function(x1, x2, sd_p, g){
  ((x2 / sd_p) - (x1 / sd_p)) / g
}

haldanes = bind_rows(early_peak, peak_late) %>% 
  mutate("gen_time" = 5490*(avg_temp + 1)^-2.05, 
         "gens" = floor(days_passed / gen_time),
         "ctmax_haldanes" = calc_halds(x2 = ctmax_two, x1 = ctmax_one, 
                                       sd_p = ctmax_sd_p, g = gens),
         "size_haldanes" = calc_halds(x2 = size_two, x1 = size_one, 
                                      sd_p = size_sd_p, g = gens))

# haldanes %>% 
#   ungroup() %>% 
#   select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>% 
#   pivot_longer(cols = c(ctmax_haldanes, size_haldanes),
#                names_to = c("type", NA), 
#                names_sep = "_",
#                values_to = "haldanes") %>% 
#   ggplot(aes(x = type, y = haldanes, group = site, colour = site)) + 
#   facet_wrap(season~.) + 
#   geom_hline(yintercept = 0) + 
#   geom_line(aes(linewidth = desc(temp_change))) + 
#   scale_colour_manual(values = site_cols) + 
#   labs(x = "Trait", 
#        y = "Haldanes", 
#        linewidth = "Temp. Change") + 
#   theme_matt_facets()

ctmax_halds_plot = haldanes %>% 
  ungroup() %>% 
  select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>%   
  ggplot(aes(x = season, y = ctmax_haldanes, colour = site, group = site)) + 
  geom_hline(yintercept = 0, colour = "grey70") + 
  geom_line(linewidth = 2) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Season",
       y = "Haldanes") + 
  ggtitle("CTmax") + 
  theme_matt() + 
  theme(legend.position = "right")

size_halds_plot = haldanes %>% 
  ungroup() %>% 
  select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>%   
  ggplot(aes(x = season, y = size_haldanes, colour = site, group = site)) + 
  geom_hline(yintercept = 0, colour = "grey70") + 
  geom_line(linewidth = 2) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Season",
       y = "Haldanes") + 
  ggtitle("Size") + 
  theme_matt() + 
  theme(legend.position = "right")

ggarrange(ctmax_halds_plot, size_halds_plot, common.legend = T, legend = "bottom")
```

```{r haldane-resids-comp-plot, fig.height=3.5, fig.width=9, include = F}
early_peak_resids = universal_resids %>% 
  filter(season %in% c("early", "peak")) %>% 
  mutate(season = if_else(season == "early", "one", "two")) %>% 
  group_by(site) %>% 
  mutate(ctmax_sd_p = sd(ctmax_resids),
         size_sd_p = sd(size_resids), 
         temp_change = max(collection_temp) - min(collection_temp),
         avg_temp = (max(collection_temp) + min(collection_temp)) / 2,
         days_passed = max(doy) - min(doy)) %>% 
  select(site, lat, season, 
         ctmax_sd_p, size_sd_p, 
         temp_change, avg_temp, days_passed, 
         ctmax_resids, size_resids) %>%
  group_by(site, lat, season, 
           ctmax_sd_p, size_sd_p, 
           temp_change, avg_temp, days_passed) %>% 
  summarize(ctmax = mean(ctmax_resids),
            size = mean(size_resids)) %>% 
  pivot_wider(id_cols = c(site, lat, ctmax_sd_p, size_sd_p, 
                          temp_change, avg_temp, days_passed), 
              names_from = season, 
              values_from = c(ctmax, size)) %>% 
  mutate(season = "early_to_peak") %>%  
  drop_na()

peak_late_resids = universal_resids %>% 
  filter(season %in% c("peak", "late")) %>% 
  mutate(season = if_else(season == "peak", "one", "two")) %>% 
  group_by(site) %>% 
  mutate(ctmax_sd_p = sd(ctmax_resids),
         size_sd_p = sd(size_resids), 
         temp_change = last(collection_temp) - first(collection_temp),
         avg_temp = (max(collection_temp) + min(collection_temp)) / 2,
         days_passed = max(doy) - min(doy)) %>% 
  select(site, lat, season, ctmax_sd_p, size_sd_p, 
         temp_change, avg_temp, days_passed, 
         ctmax_resids, size_resids) %>%
  group_by(site, lat, season, ctmax_sd_p, size_sd_p, 
           temp_change, avg_temp, days_passed) %>% 
  summarize(ctmax = mean(ctmax_resids),
            size = mean(size_resids)) %>% 
  pivot_wider(id_cols = c(site, lat, ctmax_sd_p, size_sd_p, 
                          temp_change, avg_temp, days_passed), 
              names_from = season, 
              values_from = c(ctmax, size)) %>% 
  mutate(season = "peak_to_late") %>%  
  drop_na()

calc_halds = function(x1, x2, sd_p, g){
  ((x2 / sd_p) - (x1 / sd_p)) / g
}

haldanes_resids = bind_rows(early_peak_resids, peak_late_resids) %>% 
  mutate("gen_time" = 5490*(avg_temp + 1)^-2.05, 
         "gens" = floor(days_passed / gen_time),
         "ctmax_haldanes" = calc_halds(x2 = ctmax_two, x1 = ctmax_one, 
                                       sd_p = ctmax_sd_p, g = gens),
         "size_haldanes" = calc_halds(x2 = size_two, x1 = size_one, 
                                      sd_p = size_sd_p, g = gens))

# haldanes_resids %>% 
#   ungroup() %>% 
#   select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>% 
#   pivot_longer(cols = c(ctmax_haldanes, size_haldanes),
#                names_to = c("type", NA), 
#                names_sep = "_",
#                values_to = "haldanes") %>% 
#   ggplot(aes(x = type, y = haldanes, group = site, colour = site)) + 
#   facet_wrap(season~.) + 
#   geom_hline(yintercept = 0) + 
#   geom_line(aes(linewidth = desc(temp_change))) + 
#   scale_colour_manual(values = site_cols) + 
#   labs(x = "Trait", 
#        y = "Haldanes", 
#        linewidth = "Temp. Change") + 
#   theme_matt_facets()


resids_ctmax_halds_plot = haldanes_resids %>% 
  ungroup() %>% 
  select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>%   
  ggplot(aes(x = season, y = ctmax_haldanes, colour = site, group = site)) + 
  geom_hline(yintercept = 0, colour = "grey70") + 
  geom_line(linewidth = 2) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Season",
       y = "Haldanes") + 
  ggtitle("CTmax") + 
  theme_matt() + 
  theme(legend.position = "right")

resids_size_halds_plot = haldanes_resids %>% 
  ungroup() %>% 
  select(site, temp_change, season, ctmax_haldanes, size_haldanes) %>%   
  ggplot(aes(x = season, y = size_haldanes, colour = site, group = site)) + 
  geom_hline(yintercept = 0, colour = "grey70") + 
  geom_line(linewidth = 2) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Season",
       y = "Haldanes") + 
  ggtitle("Size") + 
  theme_matt() + 
  theme(legend.position = "right")

ggarrange(resids_ctmax_halds_plot, resids_size_halds_plot, common.legend = T, legend = "bottom")
```

```{r haldanes-lat-plot, fig.height=10, fig.width=8, include = F}
# Shown below are the haldane values plotted against latitude. Note that even though large changes in temperature occurred between peak and late samples in the Chesapeake, the change in haldanes is relatively small, while in the Northern populations, changes are larger, though more variable. 

ctmax_haldanes = ggplot(haldanes, aes(x = lat, y = ctmax_haldanes, colour = site, shape = season)) + 
  geom_hline(yintercept = 0) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Latitude",
       y = "Change in CTmax (haldanes)") + 
  theme_matt_facets()

size_haldanes = ggplot(haldanes, aes(x = lat, y = size_haldanes, colour = site, shape = season)) + 
  geom_hline(yintercept = 0) + 
  geom_point(size = 3) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Latitude",
       y = "Change in Size (haldanes)") + 
  theme_matt_facets()

ggarrange(ctmax_haldanes, size_haldanes, common.legend = T, legend = "right", nrow = 2)
```

## Why does intraspecific data matter? 

Thermal limits vary substantially across both spatial and temporal scales in this species, highlighting the importance of considering both intraspecific and temporal variation in thermal limits for predictions of vulnerability to climate change. Single point estimates of thermal limits (as commonly used in larger, general analyses across taxa) obscure this crucial variation, and may bias our estimates of spatial patterns in vulnerability. Here we explore three separate scenarios to illustrate and quantify the importance of this intraspecific vulnerability. 

### Scenario 1 - Invariant thermal limits

The first scenario assumes that thermal limits are constant across both spatial and temporal axes (i.e. a single point estimate of the thermal limit for this species). Here we selected a central population (the high salinity Chesapeake Bay site), and used the average thermal limit from the peak season sample as our 'representative' thermal limit. This approach is similar to that used in Bennet et al. to compile the GlobTherm dataset. These thermal limits are used to re-estimate warming tolerance for each collection (mean thermal limit - collection temperature). We then compared this predicted warming tolerance with the actual observed warming tolerances from each collection. A positive difference indicates an overestimated warming tolerance (the population is actually closer to their thermal limits than would be predicted from the estimated value, and therefore more vulnerable). A negative difference indicates an underestimated warming tolerance (the population is further from their thermal limit than would be predicted, and therefore less vulnerable). 

Both overestimates and underestimates can be problematic for accurate management and conservation strategies. We summarize each of the scenarios using 1) the number of populations with a difference between estimates >2°C in either direction, 2) the average magnitude of difference for that subset of populations, and 3) the slope of the difference against latitude. Effective estimation strategies will have a small number of populations with under- or over-estimated warming tolerance, a small magnitude difference between predicted and observed warming tolerance, and a shallow latitudinal slope. 

In this first scenario (single point estimate of thermal limits), the effectiveness of the estimate varied across latitude and across seasons. During the early season, thermal limits from the central site were a decent predictor of warming tolerance at the other sites, and there was only a slight latitudinal trend. This latitudinal trend increased, however, during the peak and late season collections, driven by increasingly large differences in the northern sites (indicating increased vulnerability relative to predictions in these sites). During the peak season collection, warming tolerance in the southern sites was underestimated by several degrees (these populations were less vulnerable than predicted by the central site thermal limits). 

```{r}
# Compare estimated warming tolerance "ranges" when: 1) CTmax for "average" collection is used; 2) When CTmax for one collection per population is used; and 3) When all collections are used. The idea is to show that not accounting for intra-specific and intra-population variation leads to incorrect predictions of vulnerability to warming because this variation can be substantial - across populations within each seasonal collection, there is at least 5°C variation in thermal limits, while across collections within populations, acclimation to changes in temperature can drive substantial variation. 

## Scenario 1 - single point estimates 

est_1 = full_data %>% 
  group_by(site, season) %>% 
  summarise("mean_ctmax" = mean(ctmax)) %>% 
  filter(site == "Tyler Cove", season == "peak")

scenario_1 = full_data %>% 
  mutate(rep_ctmax = est_1$mean_ctmax,
         pred_wt = rep_ctmax - collection_temp, 
         wt_diff = pred_wt - warming_tol)

ggplot(scenario_1, aes(x = lat, y = wt_diff)) + 
  facet_wrap(season~., nrow = 3) + 
  geom_hline(yintercept = 0) + 
  geom_smooth(method = "lm") + 
  geom_point() + 
  labs(x = "Latitude", 
       y = "Predicted - Observed WT") + 
  theme_matt_facets()

lat.model1 = lm(data = scenario_1,
                wt_diff ~ lat*season)

lat_slope_1 = emmeans::emtrends(lat.model1, var = "lat", specs = "season") %>% 
  as.data.frame() %>% 
  select(season, lat.trend)

performance_1 = scenario_1 %>% 
  select(site, lat, season, wt_diff) %>%  
  group_by(site, season, lat) %>% 
  summarise("mean_diff" = mean(wt_diff),
            "abs_diff" = abs(mean_diff)) %>% 
  ungroup() %>% 
  mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>% 
  filter(flag == "yes") %>%  
  group_by(season) %>% 
  summarise("avg_diff" = mean(abs_diff),
            "n" = n()) %>% 
  inner_join(lat_slope_1, by = "season")
```

### Scenario 2 - Seasonally invariant thermal limits

Local adaptation of thermal limits is widely observed across a range of taxa, including *Acartia tonsa*. In the second scenario, we account for this by using average thermal limits from the peak season for each population in the estimates of warming tolerance throughout the year. 

Unsurprisingly, this approach eliminates the latitudinal trend. Instead we see that peak season estimates were generally decent predictors of warming tolerance during the early season (although there were slight overestimates in several populations), and slightly underestimated warming tolerance during the late season.

```{r}
est_2 = full_data %>% 
  group_by(site, season) %>% 
  summarise("mean_ctmax" = mean(ctmax)) %>% 
  filter(season == "peak") %>% 
  select(site, mean_ctmax)

scenario_2 = full_data %>% 
  inner_join(est_2, by = c("site")) %>% 
  mutate(pred_wt = mean_ctmax - collection_temp, 
         wt_diff = pred_wt - warming_tol)

ggplot(scenario_2, aes(x = lat, y = wt_diff)) + 
  facet_wrap(season~., nrow = 3) + 
  geom_hline(yintercept = 0) + 
  geom_smooth(method = "lm") + 
  geom_point() + 
  labs(x = "Latitude", 
       y = "Predicted - Observed WT") + 
  theme_matt_facets()

lat.model2 = lm(data = scenario_2,
                wt_diff ~ lat*season)

lat_slope_2 = emmeans::emtrends(lat.model2, var = "lat", specs = "season") %>% 
  as.data.frame() %>% 
  select(season, lat.trend)

performance_2 = scenario_2 %>% 
  select(site, lat, season, wt_diff) %>%  
  group_by(site, season, lat) %>% 
  summarise("mean_diff" = mean(wt_diff),
            "abs_diff" = abs(mean_diff)) %>% 
  ungroup() %>% 
  mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>% 
  filter(flag == "yes") %>%  
  group_by(season) %>% 
  summarise("avg_diff" = mean(abs_diff),
            "n" = n()) %>%  
  inner_join(lat_slope_2, by = c("season"))
```

### Scenario 3 - Population sub-sampling 

Both of the previous approaches to estimating warming tolerance result in overestimates of warming tolerance. These reductive methods increase the feasibility, but are unable to account for the co-occuring shifts in ambient temperature and thermal limits. Continuous in-situ monitoring of thermal limits is impractical, however, especially for species with small popuation sizes and/or very large range distributions. One potential compromise solution is to sub-sample populations and use observed data to predict spatial and seasonal changes in warming tolerance. 

In this third approach, we randomly selected nine collections, fit a linear model of CTmax ~ collection temperature, and used this regression to predict thermal limits and warming tolerance across the full set of collections. These predicted warming tolerance values were then compared against observed warming tolerance as before. We repeated this process 100 times (100 random sets of 9 collections) to examine the sensitivity of this approach the populations and seasons collected. In addition to this random data, we also included a scenario where all seasonal collections from Ft. Hamer, Tyler Cove, and Miramichi (the latitudinal extremes and a central point) were used to predict thermal limits. 

```{r}

scenario_3 = data.frame()
performance_3 = data.frame()

for(i in 1:100){
  
  est_3 = full_data %>% 
    group_by(site, season, collection_temp) %>% 
    summarise("mean_ctmax" = mean(ctmax), .groups = "keep") %>% 
    ungroup() %>% 
    filter(row_number() %in% sample(c(1:max(row_number())), size = 9, replace = F))
  
  rep.model = lm(data = est_3, mean_ctmax ~ collection_temp)
  
  rep_data = full_data %>% 
    group_by(site, season) %>%  
    mutate(mean_wt = mean(warming_tol)) %>% 
    select(site, season, collection_temp, lat, mean_wt) %>% 
    ungroup() %>% 
    distinct() %>%  
    mutate(pred_ctmax = predict(rep.model, newdata = .),
           pred_wt = pred_ctmax - collection_temp,
           wt_diff = pred_wt - mean_wt,
           run = i,
           group = "random")
  
  scenario_3 = bind_rows(scenario_3, rep_data)
  
  lat.model3 = lm(data = scenario_3,
                  wt_diff ~ lat*season)
  
  lat_slope_3 = emmeans::emtrends(lat.model3, var = "lat", specs = "season") %>% 
    as.data.frame() %>% 
    select(season, lat.trend)
  
  rep_performance = scenario_3 %>% 
    select(site, lat, season, wt_diff) %>%  
    group_by(site, season, lat) %>% 
    summarise("mean_diff" = mean(wt_diff),
              "abs_diff" = abs(mean_diff), 
              .groups = "keep") %>% 
    ungroup() %>% 
    mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>% 
    filter(flag == "yes") %>%  
    group_by(season) %>% 
    summarise("avg_diff" = mean(abs_diff),
              "n" = n(),
              .groups = "keep") %>%  
    inner_join(lat_slope_3, by = c("season"))
  
  performance_3 = bind_rows(performance_3, rep_performance)
  
}

gold_stand = full_data %>% 
  group_by(site, season, collection_temp) %>% 
  summarise("mean_ctmax" = mean(ctmax), .groups = "keep") %>% 
  ungroup() %>% 
  filter(site %in% c("Ft. Hamer", "Tyler Cove", "Miramichi"))

gold.model = lm(data = gold_stand, mean_ctmax ~ collection_temp)

gold_data = full_data %>% 
  group_by(site, season) %>%  
  mutate(mean_wt = mean(warming_tol)) %>% 
  select(site, season, collection_temp, lat, mean_wt) %>% 
  ungroup() %>% 
  distinct() %>%  
  mutate(pred_ctmax = predict(gold.model, newdata = .),
         pred_wt = pred_ctmax - collection_temp,
         wt_diff = pred_wt - mean_wt,
         run = i + 1,
         group = "gold")

gold.model = lm(data = gold_data,
                wt_diff ~ lat*season)

gold_slope = emmeans::emtrends(gold.model, var = "lat", specs = "season") %>% 
  as.data.frame() %>% 
  select(season, lat.trend)

gold_performance = gold_data %>% 
  select(site, lat, season, wt_diff) %>%  
  group_by(site, season, lat) %>% 
  summarise("mean_diff" = mean(wt_diff),
            "abs_diff" = abs(mean_diff), 
            .groups = "keep") %>% 
  ungroup() %>% 
  mutate("flag" = if_else(abs_diff >= 2, "yes", "no")) %>% 
  filter(flag == "yes") %>%  
  group_by(season) %>% 
  summarise("avg_diff" = mean(abs_diff),
            "n" = n(),
            .groups = "keep") %>%  
  inner_join(gold_slope, by = c("season"))

scenario_3 = bind_rows(scenario_3, gold_data)

performance_3_sum = performance_3 %>%  
  group_by(season) %>%  
  summarise("avg_diff" = mean(avg_diff),
            "n" = mean(n),
            "lat.trend" = mean(lat.trend))

ggplot(scenario_3, aes(x = lat, y = wt_diff, colour = group, group = run)) + 
  facet_wrap(season~., nrow = 3) + 
  geom_hline(yintercept = 0) + 
  geom_smooth(aes(colour = group), 
              method = "lm", se = F) + 
  geom_point() + 
  labs(x = "Latitude", 
       y = "Predicted - Observed WT") + 
  theme_matt_facets()

```

```{r}
knitr::kable(performance_1, caption = "Scenario 1")

knitr::kable(performance_2, caption = "Scenario 2")

knitr::kable(performance_3_sum, caption = "Scenario 3")

knitr::kable(gold_performance, caption = "`Gold` Standard")
```

```{r}
best = bind_rows(
  mutate(performance_1, "scenario" = "one"),
  mutate(performance_2, "scenario" = "two"),
  mutate(performance_3_sum, "scenario" = "three"),
  mutate(gold_performance, "scenario" = "gold")) %>% 
  group_by(season) %>%  
  filter(abs(lat.trend) == min(abs(lat.trend)))
  #filter(avg_diff == min(avg_diff))
```


## Next Steps

After phenotyping, each individual was preserved in 95% ethanol. Individual DNA libraries will be prepared using Twist Bio 96-plex prep kits, then sequenced on an Illumina NovaSeq X Plus. Using the low-coverage whole genome sequences, we will examine seasonal patterns in allele frequency change, and compare these fine scale temporal patterns with the larger latitudinal patterns in allele frequency to determine whether the same alleles driving rapid seasonal adaptation are in play over larger spatial (and longer temporal) scales.

## Misc. Details

```{r temp-record-plot, fig.width=6, fig.height=6}
ggplot(temp_record, aes(x = minute_passed, y = temp_C, group = factor(run))) + 
  geom_abline(slope = 0.3, intercept = mean(temp_record[temp_record$minute_interval == 0, 8])) + 
  geom_abline(slope = 0.1, intercept = mean(temp_record[temp_record$minute_interval == 0, 8])) + 
  geom_line(linewidth = 0.2, alpha = 0.8) + 
  geom_point(data = full_data, 
             aes(x = time, y = ctmax + 0.4),
             size = 2,
             shape = 25) +
  labs(x = "Time passed (minutes)",
       y = "Temperature (degrees C)",
       fill = "Trial Number") + 
  guides(colour = "none") + 
  theme_matt(base_size = 16) + 
  theme(legend.position = "right")
```

```{r ramp-record-plot, fig.width=6, fig.height=6}
ramp_record2 = ramp_record %>% 
  group_by(run, minute_interval) %>% 
  summarise(mean_ramp = mean(ramp_per_minute)) %>% 
  ungroup()

ggplot(ramp_record2, aes(x = minute_interval, y = mean_ramp)) + 
  geom_hline(yintercept = 0.3) + 
  geom_hline(yintercept = 0.1) + 
  #geom_point() + 
  geom_hex(bins = 30) + 
  ylim(0, 0.35) + 
  labs(y = "Ramp Rate (deg. C / min.)",
       x = "Time into run (minute)") + 
  theme_matt(base_size = 16) 
```

```{r rep-comp, fig.height=12, fig.width=8}
full_data %>% 
  drop_na(replicate) %>%  
  ggplot(aes(x = factor(replicate), y = ctmax, group = site)) + 
  facet_grid(site~season, scales = "free_y") + 
  geom_point(position = position_jitter(width = 0.1, height = 0),
             alpha = 0.4,
             colour = "grey30") + 
  geom_smooth(method = "lm", colour = "black") + 
  labs(x = "Replicate", 
       y = "CTmax") + 
  theme_matt_facets()
```

```{r num-gens-plot, fig.width=10, fig.height=7}
ggplot(haldanes, aes(x = lat, y = gens, colour = site, shape = season)) + 
  geom_hline(yintercept = 0) + 
  geom_point(size = 5) + 
  scale_colour_manual(values = site_cols) + 
  labs(x = "Latitude", 
       y = "Generations between \ncollections") +
  scale_y_continuous(breaks = seq(from = 0, to = 21, by = 5)) + 
  theme_matt() + 
  theme(legend.position = "right")
```

```{r rank-sims, fig.width=18, fig.height=8}
obs_ranks = ggplot(full_data, aes(x = rank)) + 
  facet_wrap(tube~.) + 
  geom_histogram(binwidth = 1) + 
  scale_x_continuous(breaks = c(2,4,6,8,10)) + 
  ggtitle("Observation") + 
  theme_matt_facets()

sim_data = data.frame()
for(i in 1:max(full_data$run)){
  rep_data = data.frame("tube" = sample(c(1:10), size = 10, replace = F), 
                        "rank" = c(1:10),
                        "rep" = i) %>% 
    arrange(tube)
  
  sim_data = bind_rows(sim_data, rep_data)
  
}

sim_ranks = ggplot(sim_data, aes(x = rank)) + 
  facet_wrap(tube~.) + 
  geom_histogram(binwidth = 1) + 
  scale_x_continuous(breaks = c(2,4,6,8,10)) + 
  ggtitle("Simulation") + 
  theme_matt_facets()


ggarrange(obs_ranks, sim_ranks)
```

